Skip to content

Commit 35d9db3

Browse files
committed
post rebase fixup
Signed-off-by: Anthony Chang <[email protected]>
1 parent ad1f673 commit 35d9db3

File tree

2 files changed

+3
-3
lines changed

2 files changed

+3
-3
lines changed

tensorrt_llm/_torch/modules/fused_moe/fused_moe_trtllm_gen.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -285,7 +285,7 @@ def _quantize_for_post_quant_comm(self, x):
285 285   False)
286 286   elif self.has_w4a8_mxfp4_mxfp8:
287 287   x, x_sf = torch.ops.trtllm.mxfp8_quantize(
288     - x, False, alignment=self.quant_method.weight_alignment)
    288 + x, False, alignment=self.quant_method.input_hidden_alignment)
289 289   x_row, x_col = x.shape[0], x.shape[1]
290 290   elif self.has_deepseek_fp8_block_scales:
291 291   # No change required before communication

tests/unittest/_torch/thop/parallel/test_moe.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1806,10 +1806,10 @@ def test_moe_fp8_per_tensor_scale(num_tokens, hidden_size, intermediate_size,
1806 1806   tile_tokens_dim)
1807 1807   elif routing_method_type == RoutingMethodType.Renormalize:
1808 1808   permute_info, scores = routing_reference_renormalize(
1809      - expert_logits, top_k, num_experts, tile_tokens_dim)
     1809 + expert_logits, top_k, tile_tokens_dim)
1810 1810   elif routing_method_type == RoutingMethodType.RenormalizeNaive:
1811 1811   permute_info, scores = routing_reference_renormalize_naive(
1812      - expert_logits, top_k, num_experts, tile_tokens_dim)
     1812 + expert_logits, top_k, tile_tokens_dim)
1813 1813   elif routing_method_type == RoutingMethodType.Llama4:
1814 1814   permute_info, scores = routing_reference_no_aux(
1815 1815   expert_logits, routing_bias, top_k, n_groups, top_k_groups,

0 commit comments

Comments
 (0)