From d7a243f32feb30ad4b844ae2c9534a9fa9241733 Mon Sep 17 00:00:00 2001
From: zhewenli
Date: Sun, 2 Nov 2025 15:54:49 -0800
Subject: [PATCH] update test

Signed-off-by: zhewenli
---
 vllm/_custom_ops.py | 13 ++++++++++++-
 1 file changed, 12 insertions(+), 1 deletion(-)

diff --git a/vllm/_custom_ops.py b/vllm/_custom_ops.py
index 657b11046809..cfcf534c613f 100644
--- a/vllm/_custom_ops.py
+++ b/vllm/_custom_ops.py
@@ -836,7 +836,18 @@ def cutlass_sparse_scaled_mm_supported(cuda_device_capability: int) -> bool:
 
 
 def cutlass_group_gemm_supported(cuda_device_capability: int) -> bool:
-    return torch.ops._C.cutlass_group_gemm_supported(cuda_device_capability)
+    """Query the ``_C`` custom op for grouped-GEMM support on a device.
+
+    Returns ``False`` instead of raising when the op is not registered,
+    which is the case on non-CUDA platforms.
+    """
+    try:
+        # Guard only the lookup so errors raised by the op itself propagate.
+        group_gemm_supported = torch.ops._C.cutlass_group_gemm_supported
+    except AttributeError:
+        # Op is not registered on non-CUDA platforms: report unsupported.
+        return False
+    return group_gemm_supported(cuda_device_capability)
 
 
 def cutlass_sparse_compress(a: torch.Tensor) -> tuple[torch.Tensor, torch.Tensor]: