# Review notes for the patch below (commentary only; the patch text itself is unchanged).
#
# Target file: python/sglang/srt/models/llama4.py -- a single hunk (-406,6 +406,8) that
# adds two lines at the top of the method `_is_moe_layer(self, layer_id: int) -> bool`.
#
# Behavior after the patch:
#   * If `self.config.interleave_moe_layer_step == 0`, the method returns
#     `self.config.num_local_experts > 0`; the result does not depend on `layer_id`.
#   * Otherwise it returns `(layer_id + 1) % self.config.interleave_moe_layer_step == 0`,
#     i.e. True when `layer_id + 1` is a multiple of the step. This line is unchanged
#     context, not something the patch introduces.
#
# Why the guard matters: in Python, `x % 0` raises ZeroDivisionError, so before this
# patch a step of 0 would raise in the modulo expression instead of returning a bool.
#
# NOTE(review): presumably a step of 0 denotes a config that does not interleave MoE
# layers at all -- confirm against the model config definition.
# NOTE(review): as shown here the whole patch sits on one physical line; the original
# line breaks and indentation are not recoverable from this view, so nothing has been
# reflowed. Restore them from the upstream commit before trying to apply the patch.
diff --git a/python/sglang/srt/models/llama4.py b/python/sglang/srt/models/llama4.py index 265a9391d8cf..75d4a2a29977 100644 --- a/python/sglang/srt/models/llama4.py +++ b/python/sglang/srt/models/llama4.py @@ -406,6 +406,8 @@ def __init__( ) def _is_moe_layer(self, layer_id: int) -> bool: + if self.config.interleave_moe_layer_step == 0: + return self.config.num_local_experts > 0 return (layer_id + 1) % self.config.interleave_moe_layer_step == 0 def forward(