Skip to content

Commit

Permalink
changing config for fp8 gemm
Browse files Browse the repository at this point in the history
Summary:
X-link: facebookresearch/FBGEMM#746

testing for now

Differential Revision: D69322680
  • Loading branch information
adamomainz authored and facebook-github-bot committed Feb 7, 2025
1 parent 2cef43a commit 986622b
Showing 1 changed file with 34 additions and 2 deletions.
36 changes: 34 additions & 2 deletions fbgemm_gpu/experimental/gemm/triton_gemm/fp8_gemm.py
Original file line number Diff line number Diff line change
Expand Up @@ -2988,7 +2988,7 @@ def get_full_non_persistent_tuning_space():
# num_stages=0 previously gave the best perf for all gemm configs we care
# about; it is set to 2 here while testing. Keep the range explicit so that
# we do not forget it may need other values in the future.
num_stage_range = [0]
num_stage_range = [2]
waves_per_eu_range = [0]
matrix_instr_nonkdim_range = [16, 32]
kpack_range = [1, 2]
Expand Down Expand Up @@ -3025,7 +3025,39 @@ def get_full_non_persistent_tuning_space():
return configs


MATMUL_CONFIGS_NON_PERSISTENT: List[Config] = get_full_non_persistent_tuning_space()
# Hand-picked non-persistent matmul configs. The two entries share every
# setting (16x16x256 tiles, GROUP_M=1, SPLIT_K=1, 2 warps, 2 stages) and
# differ only in "waves_per_eu": 8 first, then 0.
# NOTE(review): the "_4_8K_16K" suffix presumably names the problem shape
# these were tuned for -- confirm with the author.
MATMUL_CONFIGS_NON_PERSISTENT_4_8K_16K = [
    triton.Config(
        {
            "BLOCK_M": 16,
            "BLOCK_N": 16,
            "BLOCK_K": 256,
            "GROUP_M": 1,
            "SPLIT_K": 1,
            "waves_per_eu": waves_per_eu,
            "matrix_instr_nonkdim": 16,
            "kpack": 2,
        },
        num_warps=2,
        num_stages=2,
    )
    for waves_per_eu in (8, 0)
]

# Use the short hand-picked config list instead of the full non-persistent
# tuning space (the commit message describes this as "testing for now").
# TODO: restore the full search below once testing is finished:
# MATMUL_CONFIGS_NON_PERSISTENT: List[Config] = get_full_non_persistent_tuning_space()
MATMUL_CONFIGS_NON_PERSISTENT = MATMUL_CONFIGS_NON_PERSISTENT_4_8K_16K


@triton.autotune(
Expand Down

0 comments on commit 986622b

Please sign in to comment.