revert test changes

xu-shawn · xu-shawn · commit 539af4783a1b · 2025-06-28T11:52:18.000-07:00
diff --git a/feature_transformer.py b/feature_transformer.py
@@ -517,7 +517,7 @@ def FeatureTransformerSliceFunctionEmulate(
 
     def test():
         BATCH_SIZE = 16
-        INPUT_SIZE = 768
+        INPUT_SIZE = 10
         MAX_ACTIVE_FEATURES = 32
         STRIDE = 128
         MAX_ERROR = 1e-4
@@ -574,7 +574,6 @@ def bench():
         MAX_ACTIVE_FEATURES = 64
 
         layer = DoubleFeatureTransformerSlice(INPUT_SIZE, STRIDE).cuda()
-        layer = torch.compile(layer, fullgraph=True, mode="max-autotune")
         indices0 = torch.cat(
             [
                 torch.sort(
@@ -606,38 +605,12 @@ def bench():
             BATCH_SIZE, MAX_ACTIVE_FEATURES, dtype=torch.float32
         ).cuda()
 
-        # Warmup
-        output0, output1 = layer(indices0, values0, indices1, values1)
-        output0 = torch.clamp(output0, 0.0, 1.0)
-        output0 = output0.clone()
-        output1 = output1.clone()
-        output1 = torch.clamp(output1, 0.0, 1.0)
-        g = ((output0 - output1) ** 2).mean()
-        g.backward()
-        torch.cuda.synchronize()
-
-        for _ in range(ITERS):
-            torch.compiler.cudagraph_mark_step_begin()
-            output0, output1 = layer(indices0, values0, indices1, values1)
-            output0 = output0.clone()
-            output1 = output1.clone()
-            output0 = torch.clamp(output0, 0.0, 1.0)
-            output1 = torch.clamp(output1, 0.0, 1.0)
-
-            g = ((output0 - output1) ** 2).mean()
-            g.backward()
-
-            torch.cuda.synchronize()
-
         output0, output1 = layer(indices0, values0, indices1, values1)
 
         start = time.time()
 
         for _ in range(ITERS):
-            torch.compiler.cudagraph_mark_step_begin()
             output0, output1 = layer(indices0, values0, indices1, values1)
-            output0 = output0.clone()
-            output1 = output1.clone()
             output0 = torch.clamp(output0, 0.0, 1.0)
             output1 = torch.clamp(output1, 0.0, 1.0)