NVIDIA · shwina · Jan 5, 2026 · Jan 4, 2026 · Jan 5, 2026 · oleksandr-pavlyk
@@ -25,6 +25,7 @@
 from __future__ import annotations
 
 import enum
+import itertools
 import textwrap
 from typing import TYPE_CHECKING
 
@@ -36,6 +37,10 @@
 if TYPE_CHECKING:
     from numba.core.typing import Signature
 
+# Global counter to generate unique symbol names even when the same function
+# is used multiple times (e.g., as both selectors in `three_way_partition`).
+_wrapper_name_counter = itertools.count()
+
 __all__ = [
     "create_op_void_ptr_wrapper",
     "create_advance_void_ptr_wrapper",
@@ -146,9 +151,9 @@ def _create_void_ptr_wrapper(
     arg_str = ", ".join(arg_names)
     void_sig = types.void(*(types.voidptr for _ in arg_specs))
 
-    # Create unique wrapper name
+    # Unique wrapper name from the global counter: id(func) repeats when one func is wrapped twice
     sanitized_name = sanitize_identifier(name)
-    unique_suffix = hex(id(func))[2:]
+    unique_suffix = next(_wrapper_name_counter)
     wrapper_name = f"wrapped_{sanitized_name}_{unique_suffix}"
 
     # We need exec() here because Numba's @intrinsic decorator requires:

@@ -47,10 +47,6 @@ def __init__(
         self.discard_second = DiscardIterator(d_out)
         self.discard_unselected = DiscardIterator(d_out)
 
-        # Create a predicate that always returns False
-        def _cccl_always_false(x):
-            return False
-
         # Use three_way_partition internally
         self.partitioner = make_three_way_partition(
             d_in,
@@ -59,7 +55,7 @@ def _cccl_always_false(x):
             self.discard_unselected,  # unselected_out - discarded
             d_num_selected_out,
             cond,  # select_first_part_op - user's select condition
-            _cccl_always_false,  # select_second_part_op - always false
+            lambda x: False,  # select_second_part_op - always false
         )
 
     def __call__(

@@ -342,6 +342,36 @@ def greater_equal_op(x):
     np.testing.assert_array_equal(got_unselected, h_in)
 
 
+def test_three_way_partition_same_predicate():  # one callable is passed as both selectors
+    dtype = np.int32
+    num_items = 100
+    h_in = random_array(num_items, dtype, max_value=100)
+
+    def always_true(x):  # accepts every item regardless of its value
+        return True
+
+    d_in = cp.asarray(h_in)
+    d_first = cp.empty_like(d_in)
+    d_second = cp.empty_like(d_in)
+    d_unselected = cp.empty_like(d_in)
+    d_num_selected = cp.empty(2, dtype=np.int64)  # read below as [0] and [1] selection counts
+
+    cuda.compute.three_way_partition(
+        d_in,
+        d_first,
+        d_second,
+        d_unselected,
+        d_num_selected,
+        always_true,  # first selector
+        always_true,  # second selector: the very same function object as the first
+        num_items,
+    )
+
+    num_selected = d_num_selected.get()
+    assert int(num_selected[0]) == num_items  # every item is expected in the first count
+    assert int(num_selected[1]) == 0  # so nothing is expected in the second count
+
+
 def test_three_way_partition_all_selected_first():
     dtype = np.int32
     num_items = 20_000