We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 0bfcc77, commit 074b15a (Copy full SHA for 074b15a)
fbgemm_gpu/experimental/gemm/triton_gemm/fp8_gemm.py
@@ -2876,7 +2876,7 @@ def get_full_non_persistent_tuning_space():
2876
# For now we see better perf with one fixed num_stages value for all gemm configs we care about.
2877
# But keep this explicit so that we do not forget we may need to set it to
2878
# other values in the future
2879
- num_stage_range = [0]
+ num_stage_range = [2]
2880
waves_per_eu_range = [0]
2881
matrix_instr_nonkdim_range = [16, 32]
2882
kpack_range = [1, 2]
0 commit comments