1 parent 2205c07 commit f3da192
vllm/model_executor/layers/quantization/fp8.py
@@ -252,7 +252,7 @@ def create_weights(
     def add_padding_to_weight(self, weight: torch.Tensor) -> torch.Tensor:
         # Pad the weight tensor. This is an optimization on ROCm platform, which
         # can benefit from tensors located far enough from one another in memory
-        if (current_platform.is_rocm() and envs.VLLM_ROCM_FP8_PADDING
+        if (envs.VLLM_ROCM_FP8_PADDING and current_platform.is_rocm()
                 and weight.stride(-1) == 1
                 and (weight.stride(-2) * weight.element_size()) % 512 == 0):
             num_pad = 256 // weight.element_size()
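
For context, here is a minimal, self-contained sketch of the method this hunk touches. The reorder puts the cheap `envs.VLLM_ROCM_FP8_PADDING` flag ahead of the `current_platform.is_rocm()` probe, so the condition can short-circuit without touching the platform check when padding is disabled. The pad-then-slice body and the flag/`is_rocm()` stubs below are assumptions for illustration based on the surrounding code, not code quoted from this commit.

```python
import os

import torch
import torch.nn.functional as F

# Stand-ins for vllm's envs.VLLM_ROCM_FP8_PADDING and
# current_platform.is_rocm(), stubbed here so the sketch runs standalone.
VLLM_ROCM_FP8_PADDING = os.environ.get("VLLM_ROCM_FP8_PADDING", "1") == "1"


def is_rocm() -> bool:
    # torch.version.hip is a version string on ROCm builds, None elsewhere.
    return torch.version.hip is not None


def add_padding_to_weight(weight: torch.Tensor) -> torch.Tensor:
    # The cheap environment flag is checked first, so the platform probe
    # is skipped entirely when padding is turned off.
    if (VLLM_ROCM_FP8_PADDING and is_rocm()
            and weight.stride(-1) == 1
            and (weight.stride(-2) * weight.element_size()) % 512 == 0):
        num_pad = 256 // weight.element_size()
        # Assumed padding body: pad the last dim, then slice the padding
        # back off. The result keeps the original shape, but each row now
        # sits 256 bytes further from its neighbor in a fresh allocation.
        weight = F.pad(weight, (0, num_pad), "constant", 0)[..., :-num_pad]
        torch.cuda.empty_cache()
    return weight
```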