We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent a0592c0 commit b532a5f — Copy full SHA for b532a5f
1 file changed
python/sglang/srt/layers/ep_moe/layer.py
@@ -644,6 +644,10 @@ def process_weights_after_loading(self, layer: Module) -> None:
644
"QuantConfig has static quantization, but found "
645
"activation scales are None."
646
)
647
+ layer.w13_weight_scale = torch.nn.Parameter(
648
+ torch.max(layer.w13_weight_scale, dim=1).values,
649
+ requires_grad=False,
650
+ )
651
return
652
653
def apply(
0 commit comments