update unit test for kaiming_uniform_

zhiminzhang0830 · zhiminzhang0830 · commit 5b8a1a528ce7 · 2025-08-11T07:03:57.000Z
diff --git a/test/legacy_test/test_nn_init_function.py b/test/legacy_test/test_nn_init_function.py
@@ -21,15 +21,12 @@
 
 import paddle
 from paddle import nn
+from paddle.pir.core import ParameterMeta
 
+DELTA = 0.00001  # absolute tolerance for assertAlmostEqual(..., delta=DELTA)
 
-def get_uniform_min_and_max(weight):
-    min_value = np.min(weight)
-    max_value = np.max(weight)
-    return min_value, max_value
 
-
-class TestKaimingUniform(unittest.TestCase):
+class TestKaimingUniformFunc(unittest.TestCase):
     def _test_kaiming_uniform_common(self, tensor):
         init = paddle.nn.init.kaiming_uniform_
         init(tensor, a=0, mode="fan_in", nonlinearity="leaky_relu")
@@ -54,12 +51,54 @@ def _is_uniform(self, tensor, a, b):
     def _random_float(self, a, b):
         return (b - a) * random.random() + a
 
+    def calculate_gain(self, nonlinearity, param):
+        """Look up the recommended gain; ``param`` only feeds 'leaky_relu'."""
+        return {
+            'sigmoid': 1,
+            'linear': 1,
+            'conv1d': 1,
+            'conv2d': 1,
+            'conv3d': 1,
+            'conv1d_transpose': 1,
+            'conv_transpose1d': 1,
+            'conv2d_transpose': 1,
+            'conv_transpose2d': 1,
+            'conv3d_transpose': 1,
+            'conv_transpose3d': 1,
+            'tanh': 5.0 / 3,
+            'relu': math.sqrt(2.0),
+            'leaky_relu': math.sqrt(2.0 / (1 + param**2)),
+            'selu': 3.0 / 4,
+        }[nonlinearity]
+
+    def test_kaiming_uniform_nonlinearity(self):
+        """Check the expected bounds for several ``nonlinearity`` values.
+
+        Each case runs in its own ``subTest`` so a failure names the culprit.
+        """
+        nonlinearities = (
+            'conv_transpose1d',
+            'conv_transpose2d',
+            'conv_transpose3d',
+            'relu',
+            'leaky_relu',
+        )
+        for nonlinearity in nonlinearities:
+            with self.subTest(nonlinearity=nonlinearity):
+                weight = paddle.zeros([1024, 512])
+                paddle.nn.init.kaiming_uniform_(
+                    weight, nonlinearity=nonlinearity
+                )
+                gain = self.calculate_gain(nonlinearity=nonlinearity, param=0)
+                limit = gain * math.sqrt(3.0 / float(weight.shape[0]))
+                assert self._is_uniform(weight, -limit, limit)
+
     def test_kaiming_uniform(self):
         for use_a in [True, False]:
-            for dims in [2, 4]:
+            for dims in [2, 3, 4]:
                 for mode in ["fan_in", "fan_out"]:
                     input_tensor = self._create_random_nd_tensor(
-                        dims, size_min=20, size_max=25
+                        dims, size_min=20, size_max=108
                     )
                     if use_a:
                         a = self._random_float(0.1, 2)
@@ -86,11 +125,142 @@ def test_kaiming_uniform(self):
                         n = fan_in
                     else:
                         n = fan_out
-
-                    expected_std = math.sqrt(2.0 / ((1 + a**2) * n))
-                    bounds = expected_std * math.sqrt(3.0)
+                    expected_std = self.calculate_gain(
+                        nonlinearity='leaky_relu', param=a
+                    )
+                    bounds = expected_std * math.sqrt(3.0 / float(n))
                     assert self._is_uniform(input_tensor, -bounds, bounds)
 
+    @unittest.skipIf(
+        not paddle.is_compiled_with_cuda(), "core is not compiled with CUDA"
+    )
+    def test_kaiming_uniform_fp16(self):
+        """Check the bounds and the preserved dtype for a float16 tensor."""
+        fp16_tensor = paddle.zeros([1024, 512], dtype='float16')
+        paddle.nn.init.kaiming_uniform_(fp16_tensor)
+
+        # Expected bound: gain * sqrt(3 / fan_in), with fan_in = shape[0].
+        gain = self.calculate_gain(nonlinearity='leaky_relu', param=0)
+        limit = gain * math.sqrt(3.0 / float(fp16_tensor.shape[0]))
+        assert self._is_uniform(fp16_tensor, -limit, limit)
+        assert fp16_tensor.dtype == paddle.float16
+
+
+class TestKaimingUniformFuncPir(unittest.TestCase):
+    """Check the op found in a PIR block after ``kaiming_uniform_``."""
+
+    def setUp(self):
+        self.init_uniform_op_name = 'pd_op.uniform'
+
+    def get_operand_definition_op_attrs(self, cur_op, operand_name, attr_name):
+        """Return ``attr_name`` of the op that defines an input of ``cur_op``.
+
+        The input is selected by ``operand_name``; the test fails if absent.
+        """
+        input_names = cur_op.get_input_names()
+        self.assertIn(operand_name, input_names)
+        operand = cur_op.operand(input_names.index(operand_name))
+        return operand.source().get_defining_op().attrs()[attr_name]
+
+    def get_init_ops_by_op_name(self, block, op_name):
+        """Return the ops of ``block`` whose ``name()`` equals ``op_name``."""
+        return [op for op in block.ops if op_name == op.name()]
+
+    def test_kaiming_uniform_(self):
+        """2-D parameter, default arguments: limit is sqrt(6 / shape[0])."""
+        with paddle.pir_utils.IrGuard():
+            main = paddle.static.Program()
+            with paddle.static.program_guard(main, paddle.static.Program()):
+                parameter_meta = ParameterMeta([1024, 512], paddle.float32)
+                init_result = paddle.nn.init.kaiming_uniform_(
+                    parameter_meta, block=main.global_block()
+                )
+                block = main.global_block()
+                checked_ops = self.get_init_ops_by_op_name(
+                    block, self.init_uniform_op_name
+                )
+                self.assertEqual(len(checked_ops), 1)
+                init_op = checked_ops[0]
+                limit = np.sqrt(6.0 / init_result.shape[0])
+                # Bounds are read from the ops defining "min" and "max".
+                min_value = self.get_operand_definition_op_attrs(
+                    init_op, "min", "value"
+                )
+                max_value = self.get_operand_definition_op_attrs(
+                    init_op, "max", "value"
+                )
+                self.assertAlmostEqual(min_value, -limit, delta=DELTA)
+                self.assertAlmostEqual(max_value, limit, delta=DELTA)
+                self.assertEqual(init_op.attrs()['seed'], 0)
+
+    def test_kaiming_uniform_conv(self):
+        """4-D parameter, default mode: fan is shape[1] * shape[2] * shape[3]."""
+        with paddle.pir_utils.IrGuard():
+            main = paddle.static.Program()
+            with paddle.static.program_guard(main, paddle.static.Program()):
+                parameter_meta = ParameterMeta([5, 10, 15, 20], paddle.float32)
+                init_result = paddle.nn.init.kaiming_uniform_(
+                    parameter_meta, block=main.global_block()
+                )
+                block = main.global_block()
+                checked_ops = self.get_init_ops_by_op_name(
+                    block, self.init_uniform_op_name
+                )
+                self.assertEqual(len(checked_ops), 1)
+                init_op = checked_ops[0]
+                limit = np.sqrt(
+                    6.0
+                    / (
+                        init_result.shape[1]
+                        * init_result.shape[2]
+                        * init_result.shape[3]
+                    )
+                )
+                # Bounds are read from the ops defining "min" and "max".
+                min_value = self.get_operand_definition_op_attrs(
+                    init_op, "min", "value"
+                )
+                max_value = self.get_operand_definition_op_attrs(
+                    init_op, "max", "value"
+                )
+                self.assertAlmostEqual(min_value, -limit, delta=DELTA)
+                self.assertAlmostEqual(max_value, limit, delta=DELTA)
+                self.assertEqual(init_op.attrs()['seed'], 0)
+
+    def test_kaiming_uniform_fan_out(self):
+        """With mode='fan_out' the fan is shape[0] * shape[2] * shape[3]."""
+        with paddle.pir_utils.IrGuard():
+            main = paddle.static.Program()
+            with paddle.static.program_guard(main, paddle.static.Program()):
+                parameter_meta = ParameterMeta([5, 10, 15, 20], paddle.float32)
+                init_result = paddle.nn.init.kaiming_uniform_(
+                    parameter_meta, mode='fan_out', block=main.global_block()
+                )
+                block = main.global_block()
+                checked_ops = self.get_init_ops_by_op_name(
+                    block, self.init_uniform_op_name
+                )
+                self.assertEqual(len(checked_ops), 1)
+                init_op = checked_ops[0]
+                limit = np.sqrt(
+                    6.0
+                    / (
+                        init_result.shape[0]
+                        * init_result.shape[2]
+                        * init_result.shape[3]
+                    )
+                )
+                # Bounds are read from the ops defining "min" and "max".
+                min_value = self.get_operand_definition_op_attrs(
+                    init_op, "min", "value"
+                )
+                max_value = self.get_operand_definition_op_attrs(
+                    init_op, "max", "value"
+                )
+                self.assertAlmostEqual(min_value, -limit, delta=DELTA)
+                self.assertAlmostEqual(max_value, limit, delta=DELTA)
+                self.assertEqual(init_op.attrs()['seed'], 0)
+
 
 if __name__ == '__main__':
     unittest.main()