Support tensor index: allow a multi-dimensional Index input in index_select op.

hbwx24 · hbwx24 · commit ec94322cfc3c · 2021-08-11T12:14:22.000Z
diff --git a/paddle/fluid/operators/index_select_op.cc b/paddle/fluid/operators/index_select_op.cc
@@ -46,19 +46,32 @@ class IndexSelectOp : public framework::OperatorWithKernel {
             "to be in range of [-%d, %d]. But received Attr(dim) = %d.",
             input_dim.size(), input_dim.size() - 1, dim));
 
-    PADDLE_ENFORCE_EQ(
-        index_dim.size() == 1 || (index_dim.size() == 2 && index_dim[1] == 1),
-        true, platform::errors::InvalidArgument(
-                  "The 'shape' of Input(Index) must be 1-D tensor. "
-                  "But received: the 'shape' of Input(Index) is [%s], "
-                  "the dimension of Input(Index) is [%d].",
-                  index_dim, index_dim.size()));
-
-    auto output_dim = framework::vectorize(input_dim);
+    // PADDLE_ENFORCE_EQ(
+    //     index_dim.size() == 1 || (index_dim.size() == 2 && index_dim[1] ==
+    //     1),
+    //     true, platform::errors::InvalidArgument(
+    //               "The 'shape' of Input(Index) must be 1-D tensor. "
+    //               "But received: the 'shape' of Input(Index) is [%s], "
+    //               "the dimension of Input(Index) is [%d].",
+    //               index_dim, index_dim.size()));
+
     if (dim < 0) {
       dim += input_dim.size();
     }
-    output_dim[dim] = index_dim[0];
+    // auto output_dim = framework::vectorize(input_dim);
+    // output_dim[dim] = index_dim[0];
+    std::vector<int64_t> output_dim(input_dim.size() + index_dim.size() - 1);
+
+    for (int i = 0; i < static_cast<int>(output_dim.size()); i++) {
+      if (i < dim) {
+        output_dim[i] = input_dim[i];
+      } else if (i < dim + index_dim.size()) {
+        output_dim[i] = index_dim[i - dim];
+      } else {
+        output_dim[i] = input_dim[i - index_dim.size() + 1];
+      }
+    }
+
     ctx->SetOutputDim("Out", framework::make_ddim(output_dim));
     auto type = ctx->GetInputsVarType("X")[0];
     if (type == framework::proto::VarType::LOD_TENSOR) {
diff --git a/paddle/fluid/operators/index_select_op.cu b/paddle/fluid/operators/index_select_op.cu
@@ -77,7 +77,10 @@ class IndexSelectCUDAKernel : public framework::OpKernel<T> {
     dim = dim >= 0 ? dim : dim + input_dim.size();
     auto stride_dim = framework::stride(input_dim);
     int64_t stride = stride_dim[dim];
-    int64_t size = output_dim[dim];
+    int64_t size = 1;
+    for (int i = 0; i < index->dims().size(); i++) {
+      size *= output_dim[dim + i];
+    }
     int64_t delta = input_dim[dim] - size;
 
     const auto& index_type = index->type();
@@ -143,7 +146,12 @@ class IndexSelectGradCUDAKernel : public framework::OpKernel<T> {
     dim = dim >= 0 ? dim : dim + input_dim.size();
     auto stride_dim = framework::stride(input_dim);
     int64_t stride = stride_dim[dim];
-    int64_t size = input_dim[dim];
+
+    int64_t size = 1;
+    for (int i = 0; i < index->dims().size(); i++) {
+      size *= input_dim[dim + i];
+    }
+
     int64_t delta = output_dim[dim] - size;
 
     const auto& index_type = index->type();
diff --git a/paddle/fluid/operators/index_select_op.h b/paddle/fluid/operators/index_select_op.h
@@ -46,8 +46,12 @@ void IndexSelectInner(const framework::ExecutionContext& context,
   for (auto i = 0; i < dim; i++) {
     outer_nums *= input_dim[i];
   }
-
-  auto index_size = index.dims()[0];
+  int index_size = 1;
+  auto index_dim = index.dims();
+  for (int i = 0; i < index_dim.size(); i++) {
+    index_size *= index.dims()[i];
+  }
+  // auto index_size = index.dims()[0];
 
   std::vector<T> input_vec;
   std::vector<IndexT> index_vec;
@@ -179,7 +183,18 @@ void IndexSelectGradInner(const framework::ExecutionContext& context,
     outer_nums *= input_dim[i];
   }
 
-  auto index_size = index->dims()[0];
+  // Previously: auto index_size = index->dims()[0];
+  // The index may now be multi-dimensional, so count all of its elements.
+  int index_size = index->numel();
+
+  for (int i = 0; i < index_size; i++) {
+    // Strict bound, as the message states; report the offending element.
+    PADDLE_ENFORCE_LT(index_data[i], input_dim[dim],
+        platform::errors::InvalidArgument(
+            "Element of index should be less than %d, but received %d.",
+            input_dim[dim], index_data[i]));
+  }
+
   VLOG(3) << "Index_Select_Grad_Debug; outer_nums: " << outer_nums
           << "; slice_size: " << slice_size << "; input_width: " << input_width
           << "; output_width: " << output_width
diff --git a/python/paddle/fluid/tests/unittests/test_index_select_op.py b/python/paddle/fluid/tests/unittests/test_index_select_op.py
@@ -21,6 +21,7 @@
 from op_test import OpTest
 import paddle.fluid as fluid
 from paddle.fluid import Program, program_guard
+from functools import reduce
 
 
 class TestIndexSelectOp(OpTest):
@@ -131,5 +132,99 @@ def test_dygraph_api(self):
         self.assertTrue(np.allclose(expect_out, np_z))
 
 
+class TestTensorIndex(unittest.TestCase):
+    def numel(self, shape):
+        return reduce(lambda x, y: x * y, shape)
+
+    def test_dygraph(self):
+        paddle.disable_static()
+
+        inps_shape = [7, 6, 5, 4, 3]
+        array = np.arange(self.numel(inps_shape)).reshape(inps_shape)
+
+        index_shape = [7, 6, 5, 4, 3]
+        index = np.arange(self.numel(index_shape)).reshape(index_shape)
+        for i in range(len(inps_shape) - 1):
+
+            pt = paddle.to_tensor(array)
+            index_mod = index % (array.shape[0])
+            pindex = paddle.to_tensor(index_mod)
+            getitem_np = array[index_mod]
+            getitem_pp = pt[pindex]
+            self.assertTrue(np.array_equal(getitem_np, getitem_pp.numpy()))
+            array = array[0]
+            index = index[0]
+
+    def test_static_graph(self):
+        paddle.enable_static()
+        inps_shape = [1, 2, 3, 4, 5]
+        array = np.arange(
+            self.numel(inps_shape), dtype='float32').reshape(inps_shape)
+
+        index_shape = [7, 6, 5, 4, 3]
+        index = np.arange(self.numel(index_shape)).reshape(index_shape)
+
+        for i in range(len(inps_shape) - 1):
+            index_mod = index % (array.shape[0])
+            program = paddle.static.Program()
+
+            with paddle.static.program_guard(program):
+                x = paddle.static.data(
+                    name='x', shape=array.shape, dtype='float32')
+                if i % 2 == 0:
+                    index_dtype = 'int32'
+                    index_mod = index_mod.astype('int32')
+                else:
+                    index_dtype = 'int64'
+                    index_mod = index_mod.astype('int64')
+
+                index_p = paddle.static.data(
+                    name='index', shape=index.shape, dtype=index_dtype)
+
+                y = x[index_p]
+
+                place = paddle.fluid.CPUPlace(
+                ) if not paddle.fluid.core.is_compiled_with_cuda(
+                ) else paddle.fluid.CUDAPlace(0)
+
+                prog = paddle.static.default_main_program()
+                exe = paddle.static.Executor(place)
+
+                exe.run(paddle.static.default_startup_program())
+                fetch_list = [y.name]
+                getitem_pp = exe.run(
+                    prog,
+                    feed={x.name: array,
+                          index_p.name: index_mod},
+                    fetch_list=fetch_list)
+
+                getitem_np = array[index_mod]
+                self.assertTrue(np.array_equal(getitem_np, getitem_pp[0]))
+
+            array = array[0]
+            index = index[0]
+
+    def test_backward(self):
+        paddle.disable_static()
+        array = np.arange(4 * 3 * 2, dtype='float32').reshape([4, 3, 2])
+        index = [[1, 2], [0, 3]]
+
+        index_p = paddle.to_tensor(index)
+        pt = paddle.to_tensor(array, stop_gradient=False)
+
+        y = pt[index_p]
+        y = y * y
+        loss = y.sum()
+        loss.backward()
+        grad_torch = np.array([[[0., 2.], [4., 6.], [8., 10.]],
+                               [[12., 14.], [16., 18.], [20., 22.]],
+                               [[24., 26.], [28., 30.],
+                                [32., 34.]], [[36., 38.], [40., 42.],
+                                              [44., 46.]]])
+        self.assertTrue(
+            np.array_equal(pt.grad.numpy(), grad_torch),
+            msg='grad of index_select_op:\n{}'.format(pt.grad.numpy()))
+
+
 if __name__ == '__main__':
     unittest.main()