Skip to content

Commit 2303d8f

Browse files
committed
Add one more test config to cover the RenormalizeNaive routing method
Signed-off-by: jiahanc <[email protected]>
1 parent 2e2c370 commit 2303d8f

File tree

2 files changed

+17
-1
lines changed

2 files changed

+17
-1
lines changed

flashinfer/fused_moe/core.py

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -178,7 +178,8 @@ class GatedActType(IntEnum):
178  178    GeGlu = 1
179  179
180  180
181       - def is_flashinfer_trtllm_moe_supported(
     181  + @functools.cache
     182  + def is_trtllm_moe_supported(
182  183    dtype_weights: DtypeTrtllmGen,
183  184    dtype_act: DtypeTrtllmGen,
184  185    quant_method: Optional[str] = None,

tests/moe/test_trtllm_gen_fused_moe.py

Lines changed: 15 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -2296,6 +2296,21 @@ def run_moe_test(
2296  2296    "compatible_moe_impls": [FP8BlockScaleMoe, FP4Moe, BF16Moe],
2297  2297    "compatible_intermediate_size": [384, 768, 1024],
2298  2298    },
      2299  + id="Qwen3",
      2300  + ),
      2301  + pytest.param(
      2302  + {
      2303  + "num_experts": 256,
      2304  + "top_k": 8,
      2305  + "padding": 8,
      2306  + "n_groups": None,
      2307  + "top_k_groups": None,
      2308  + "routed_scaling": None,
      2309  + "has_routing_bias": False,
      2310  + "routing_method_type": RoutingMethodType.RenormalizeNaive,
      2311  + "compatible_moe_impls": [FP8BlockScaleMoe, FP4Moe, BF16Moe],
      2312  + "compatible_intermediate_size": [384, 1024],
      2313  + },
2299  2314    id="Renorm",
2300  2315    ),
2301  2316    pytest.param(

0 commit comments

Comments
 (0)