[CI/Build] Update checking logic in cutlass_group_gemm_supported (vllm-project#27948)

zhewenl · devpatelio · commit 33a4498dc92c · 2025-11-28T16:30:28.000-08:00
Signed-off-by: zhewenli <zhewenli@meta.com>
diff --git a/vllm/_custom_ops.py b/vllm/_custom_ops.py
@@ -836,7 +836,11 @@ def cutlass_sparse_scaled_mm_supported(cuda_device_capability: int) -> bool:
 
 
 def cutlass_group_gemm_supported(cuda_device_capability: int) -> bool:
-    return torch.ops._C.cutlass_group_gemm_supported(cuda_device_capability)
+    try:
+        return torch.ops._C.cutlass_group_gemm_supported(cuda_device_capability)
+    except AttributeError:
+        # Return False on non-CUDA platforms where it is not available
+        return False
 
 
 def cutlass_sparse_compress(a: torch.Tensor) -> tuple[torch.Tensor, torch.Tensor]: