From d7a243f32feb30ad4b844ae2c9534a9fa9241733 Mon Sep 17 00:00:00 2001
From: zhewenli <zhewenli@meta.com>
Date: Sun, 2 Nov 2025 15:54:49 -0800
Subject: [PATCH] Return False from cutlass_group_gemm_supported when the op is unavailable

Signed-off-by: zhewenli <zhewenli@meta.com>
---
 vllm/_custom_ops.py | 6 +++++-
 1 file changed, 5 insertions(+), 1 deletion(-)

diff --git a/vllm/_custom_ops.py b/vllm/_custom_ops.py
index 657b11046809..cfcf534c613f 100644
--- a/vllm/_custom_ops.py
+++ b/vllm/_custom_ops.py
@@ -836,7 +836,11 @@ def cutlass_sparse_scaled_mm_supported(cuda_device_capability: int) -> bool:
 
 
 def cutlass_group_gemm_supported(cuda_device_capability: int) -> bool:
-    return torch.ops._C.cutlass_group_gemm_supported(cuda_device_capability)
+    try:
+        return torch.ops._C.cutlass_group_gemm_supported(cuda_device_capability)
+    except AttributeError:
+        # The _C op is not registered on non-CUDA platforms; report unsupported.
+        return False
 
 
 def cutlass_sparse_compress(a: torch.Tensor) -> tuple[torch.Tensor, torch.Tensor]: