14 changes: 10 additions & 4 deletions sgl-kernel/python/sgl_kernel/utils.py
@@ -41,8 +41,14 @@ def _to_tensor_scalar_tuple(x):
     return (None, x)


+_IS_HOPPER_ARCH = None
Collaborator:
I think it would be better to cache it after this line:

from sgl_kernel.utils import get_cuda_stream, is_hopper_arch

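For illustration, a minimal sketch of what this import-time caching could look like on the consumer side (the op function below is hypothetical, not code from this PR):

from sgl_kernel.utils import get_cuda_stream, is_hopper_arch

# Evaluated once when the consuming module is imported; later reads are
# plain module-global lookups with no per-call function overhead.
_IS_HOPPER_ARCH = is_hopper_arch()


def elementwise_op(x):
    # Hypothetical caller branching on the precomputed flag.
    if _IS_HOPPER_ARCH:
        return x  # placeholder for a Hopper-tuned path
    return x  # placeholder for the generic path

One tradeoff of this placement is that the CUDA device query runs as a side effect of importing the module.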
Collaborator:
But implementing it in the function also has its advantages: everything other than the element-wise ops can use it.

Contributor Author:
Yeah, maybe keep it here because other functions may call it in the future?



 def is_hopper_arch() -> bool:
-    # Hopper arch's compute capability == 9.0
-    device = torch.cuda.current_device()
-    major, minor = torch.cuda.get_device_capability(device)
-    return major == 9
+    global _IS_HOPPER_ARCH
+    if _IS_HOPPER_ARCH is None:
+        # Hopper arch's compute capability == 9.0
+        device = torch.cuda.current_device()
+        major, _ = torch.cuda.get_device_capability(device)
+        _IS_HOPPER_ARCH = major == 9
+    return _IS_HOPPER_ARCH
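To make the cached behavior concrete, a small standalone illustration (mine, not from the PR) of how the new version behaves across calls:

from sgl_kernel.utils import is_hopper_arch

flag = is_hopper_arch()  # first call queries the current CUDA device
# Later calls return the stored result without touching the device, so on
# a mixed-architecture multi-GPU host the flag reflects whichever device
# was current on the first call.
assert is_hopper_arch() == flag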
Contributor:

Severity: medium

The current implementation for caching is_hopper_arch using a global variable is functional. However, Python's functools.lru_cache decorator offers a more idiomatic and often cleaner way to achieve the same result with less boilerplate.

Using @functools.lru_cache(maxsize=1) (or functools.cache on Python 3.9+, which is equivalent to lru_cache(maxsize=None)) would:

  • Eliminate the need for the explicit _IS_HOPPER_ARCH global variable and the manual check-and-set logic.
  • Handle thread-safety aspects of cache access automatically (Python's lru_cache is thread-safe).
  • Make the intent of caching immediately clear through the decorator.

To implement this, you would need to add import functools at the top of the file.

What are your thoughts on refactoring to use lru_cache for this?

@functools.lru_cache(maxsize=1)
def is_hopper_arch() -> bool:
    # Hopper arch's compute capability == 9.0
    device = torch.cuda.current_device()
    major, _ = torch.cuda.get_device_capability(device)
    return major == 9
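An incidental benefit of the decorator approach (my observation, not from the review): lru_cache-wrapped functions expose cache-management helpers, so the cached flag is easy to reset, e.g. in tests that change the device:

is_hopper_arch()              # first call performs the device query
is_hopper_arch()              # served from the cache
is_hopper_arch.cache_clear()  # reset the cached result between tests
is_hopper_arch.cache_info()   # CacheInfo(hits=..., misses=..., ...) stats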