File tree (expand / collapse file tree): 1 file changed, +30 -2 lines changed
fbgemm_gpu/experimental/gemm/triton_gemm (expand / collapse file tree): 1 file changed, +30 -2 lines changed
Columns: Original file line number | Diff line number | Diff line change
@@ -3868,6 +3868,20 @@ def get_full_non_persistent_tuning_space():
3868
3868
num_warps = 8 ,
3869
3869
num_stages = 2 ,
3870
3870
),
3871
+ triton .Config (
3872
+ {
3873
+ "BLOCK_M" : 256 ,
3874
+ "BLOCK_N" : 256 ,
3875
+ "BLOCK_K" : 128 ,
3876
+ "GROUP_M" : 2 ,
3877
+ "SPLIT_K" : 1 ,
3878
+ "waves_per_eu" : 0 ,
3879
+ "matrix_instr_nonkdim" : 16 ,
3880
+ "kpack" : 1 ,
3881
+ },
3882
+ num_warps = 8 ,
3883
+ num_stages = 2 ,
3884
+ ),
3871
3885
triton .Config (
3872
3886
{
3873
3887
"BLOCK_M" : 256 ,
@@ -3876,12 +3890,26 @@ def get_full_non_persistent_tuning_space():
3876
3890
"GROUP_M" : 2 ,
3877
3891
"SPLIT_K" : 1 ,
3878
3892
"waves_per_eu" : 2 ,
3879
- "matrix_instr_nonkdim" : 32 ,
3880
- "kpack" : 2 ,
3893
+ "matrix_instr_nonkdim" : 16 ,
3894
+ "kpack" : 1 ,
3881
3895
},
3882
3896
num_warps = 8 ,
3883
3897
num_stages = 2 ,
3884
3898
),
3899
+ triton .Config (
3900
+ {
3901
+ "BLOCK_M" : 128 ,
3902
+ "BLOCK_N" : 256 ,
3903
+ "BLOCK_K" : 64 ,
3904
+ "GROUP_M" : 2 ,
3905
+ "SPLIT_K" : 1 ,
3906
+ "waves_per_eu" : 2 ,
3907
+ "matrix_instr_nonkdim" : 16 ,
3908
+ "kpack" : 1 ,
3909
+ },
3910
+ num_warps = 4 ,
3911
+ num_stages = 2 ,
3912
+ ),
3885
3913
triton .Config (
3886
3914
{
3887
3915
"BLOCK_M" : 256 ,
You can’t perform that action at this time.
0 commit comments