Skip to content

Commit f13371e

Browse files
committed
test=develop
1 parent f4bfc95 commit f13371e

3 files changed

Lines changed: 217 additions & 16 deletions

File tree

lite/kernels/host/sequence_mask_compute.cc

Lines changed: 43 additions & 16 deletions
Original file line numberDiff line numberDiff line change
@@ -19,32 +19,62 @@ namespace lite {
1919
namespace kernels {
2020
namespace host {
2121

22+
// Writes a 0/1 mask of shape [x_size, max_len] into y:
// row i has a 1 at position j iff static_cast<Tx>(j) < x[i]
// (i.e. ceil(x[i]) leading ones), and 0 everywhere else.
template <class Tx, class Ty>
void SequenceMask(const Tx* x, Ty* y, const int x_size, const int max_len) {
  // Zero the whole output once; each row then only writes its leading ones.
  // (The previous version also wrote a 0/1 into every cell in the inner
  // loop, so every element was stored twice.)
  memset(y, 0, sizeof(Ty) * x_size * max_len);
  for (int i = 0; i < x_size; i++) {
    // `static_cast<Tx>(j) < x[i]` is monotonically non-increasing in j,
    // so we can stop at the first j for which it fails.
    for (int j = 0; j < max_len && static_cast<Tx>(j) < x[i]; j++) {
      y[j] = static_cast<Ty>(1);
    }
    y += max_len;
  }
}
32+
2233
template <class T>
2334
void SequenceMaskCompute<T>::Run() {
2435
auto& param = this->template Param<param_t>();
2536
auto* x = param.X;
26-
auto* y = parm.Y;
27-
int maxlen = param.maxlen;
37+
auto* y = param.Y;
38+
int max_len = param.maxlen;
2839
auto* max_len_tensor = param.MaxLenTensor;
2940
if (max_len_tensor != nullptr) {
30-
maxlen = max_len_tensor->template data<int>()[0];
31-
CHECK_GT(maxlen, 0) << "Input(MaxLenTensor)'s value should be greater than "
32-
"0. But received maxlen: "
33-
<< maxlen;
41+
max_len = max_len_tensor->template data<int>()[0];
42+
CHECK_GT(max_len, 0)
43+
<< "Input(MaxLenTensor)'s value should be greater than "
44+
"0. But received maxlen: "
45+
<< max_len;
3446
}
3547

3648
auto* x_data = x->template data<T>();
37-
auto x_size = x->numel();
38-
if (maxlen < 0) {
39-
maxlen = static_cast<int>(*std::max_element(x_data, x_data + x_size));
49+
int x_size = static_cast<int>(x->numel());
50+
if (max_len < 0) {
51+
max_len = static_cast<int>(*std::max_element(x_data, x_data + x_size));
4052
}
4153

4254
auto y_shape = x->dims().Vectorize();
43-
y_shape.push_back(static_cast<int64_t>(maxlen));
55+
y_shape.push_back(static_cast<int64_t>(max_len));
4456
y->Resize(y_shape);
4557
y->set_lod(x->lod());
4658

4759
int out_type = param.out_dtype;
60+
switch (lite::core::FluidType(out_type)) {
61+
case lite::core::FluidType::FP32: {
62+
SequenceMask(x_data, y->template mutable_data<float>(), x_size, max_len);
63+
break;
64+
}
65+
case lite::core::FluidType::INT32: {
66+
SequenceMask(x_data, y->template mutable_data<int>(), x_size, max_len);
67+
break;
68+
}
69+
case lite::core::FluidType::INT64: {
70+
SequenceMask(
71+
x_data, y->template mutable_data<int64_t>(), x_size, max_len);
72+
break;
73+
}
74+
default:
75+
LOG(FATAL) << "unsupported out data type: " << out_type;
76+
break;
77+
}
4878
}
4979

5080
} // namespace host
@@ -61,8 +91,7 @@ REGISTER_LITE_KERNEL(sequence_mask,
6191
.BindInput("X", {LiteType::GetTensorTy(TARGET(kHost), PRECISION(kFloat))})
6292
.BindInput("MaxLenTensor",
6393
{LiteType::GetTensorTy(TARGET(kHost), PRECISION(kInt32))})
64-
.BindOutput("Output",
65-
{LiteType::GetTensorTy(TARGET(kHost), PRECISION(kAny))})
94+
.BindOutput("Y", {LiteType::GetTensorTy(TARGET(kHost), PRECISION(kAny))})
6695
.Finalize();
6796

6897
REGISTER_LITE_KERNEL(sequence_mask,
@@ -74,8 +103,7 @@ REGISTER_LITE_KERNEL(sequence_mask,
74103
.BindInput("X", {LiteType::GetTensorTy(TARGET(kHost), PRECISION(kInt32))})
75104
.BindInput("MaxLenTensor",
76105
{LiteType::GetTensorTy(TARGET(kHost), PRECISION(kInt32))})
77-
.BindOutput("Output",
78-
{LiteType::GetTensorTy(TARGET(kHost), PRECISION(kAny))})
106+
.BindOutput("Y", {LiteType::GetTensorTy(TARGET(kHost), PRECISION(kAny))})
79107
.Finalize();
80108

81109
REGISTER_LITE_KERNEL(sequence_mask,
@@ -87,6 +115,5 @@ REGISTER_LITE_KERNEL(sequence_mask,
87115
.BindInput("X", {LiteType::GetTensorTy(TARGET(kHost), PRECISION(kInt64))})
88116
.BindInput("MaxLenTensor",
89117
{LiteType::GetTensorTy(TARGET(kHost), PRECISION(kInt32))})
90-
.BindOutput("Output",
91-
{LiteType::GetTensorTy(TARGET(kHost), PRECISION(kAny))})
118+
.BindOutput("Y", {LiteType::GetTensorTy(TARGET(kHost), PRECISION(kAny))})
92119
.Finalize();

lite/tests/kernels/CMakeLists.txt

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -65,6 +65,7 @@ if((NOT LITE_WITH_FPGA AND NOT LITE_WITH_BM AND NOT LITE_WITH_MLU) AND (LITE_WIT
6565
if(LITE_BUILD_EXTRA)
6666
lite_cc_test(test_gru_unit SRCS gru_unit_test.cc DEPS ${test_kernel_deps})
6767
lite_cc_test(test_sequence_pad SRCS sequence_pad_test.cc DEPS ${test_kernel_deps})
68+
lite_cc_test(test_sequence_mask SRCS sequence_mask_test.cc DEPS ${test_kernel_deps})
6869
lite_cc_test(test_correlation SRCS correlation_test.cc DEPS ${test_kernel_deps})
6970
#lite_cc_test(test_kernel_sequence_pool_compute SRCS sequence_pool_compute_test.cc DEPS ${test_kernel_deps})
7071
lite_cc_test(test_kernel_sequence_conv_compute SRCS sequence_conv_compute_test.cc DEPS ${test_kernel_deps})
Lines changed: 173 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,173 @@
1+
// Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved.
2+
//
3+
// Licensed under the Apache License, Version 2.0 (the "License");
4+
// you may not use this file except in compliance with the License.
5+
// You may obtain a copy of the License at
6+
//
7+
// http://www.apache.org/licenses/LICENSE-2.0
8+
//
9+
// Unless required by applicable law or agreed to in writing, software
10+
// distributed under the License is distributed on an "AS IS" BASIS,
11+
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12+
// See the License for the specific language governing permissions and
13+
// limitations under the License.
14+
15+
#include <gtest/gtest.h>
16+
#include <cmath>
17+
#include "lite/api/paddle_use_kernels.h"
18+
#include "lite/api/paddle_use_ops.h"
19+
#include "lite/core/arena/framework.h"
20+
#include "lite/tests/utils/fill_data.h"
21+
22+
namespace paddle {
23+
namespace lite {
24+
25+
// Reference mask used by the baseline: row i of y (width max_len) gets
// ceil(x[i]) leading ones and zeros elsewhere.
template <class Tx, class Ty>
void SequenceMask(const Tx* x, Ty* y, const int x_size, const int max_len) {
  memset(y, 0, sizeof(Ty) * x_size * max_len);
  for (int i = 0; i < x_size; i++) {
    int step = static_cast<int>(std::ceil(static_cast<float>(x[i])));
    // Clamp to the row width so an x[i] larger than max_len cannot write
    // past the end of the row (the unclamped version is out-of-bounds).
    step = std::min(step, max_len);
    for (int j = 0; j < step; j++) {
      y[j] = static_cast<Ty>(1);
    }
    y += max_len;
  }
}
36+
37+
template <class T>
38+
class SequenceMaskTester : public arena::TestCase {
39+
protected:
40+
std::string x_ = "x";
41+
std::string max_len_tensor_;
42+
std::string y_ = "y";
43+
int max_len_{-1};
44+
int out_type_{5};
45+
DDim x_dims_{{2, 3, 4}};
46+
47+
public:
48+
SequenceMaskTester(const Place& place,
49+
const std::string& alias,
50+
const int max_len = 5,
51+
const int out_type = 5,
52+
const bool use_max_len_tensor = false)
53+
: TestCase(place, alias), max_len_(max_len), out_type_(out_type) {
54+
if (use_max_len_tensor) {
55+
max_len_tensor_ = std::string("max_len_tensor");
56+
}
57+
}
58+
59+
void RunBaseline(Scope* scope) override {
60+
auto* y = scope->NewTensor(y_);
61+
auto y_shape = x_dims_.Vectorize();
62+
y_shape.push_back(static_cast<int64_t>(max_len_));
63+
y->Resize(y_shape);
64+
65+
auto* x = scope->FindTensor(x_);
66+
auto* x_data = x->template data<T>();
67+
int x_size = static_cast<int>(x->numel());
68+
69+
switch (out_type_) {
70+
case 5: {
71+
SequenceMask(
72+
x_data, y->template mutable_data<float>(), x_size, max_len_);
73+
break;
74+
}
75+
case 2: {
76+
SequenceMask(x_data, y->template mutable_data<int>(), x_size, max_len_);
77+
break;
78+
}
79+
case 3: {
80+
SequenceMask(
81+
x_data, y->template mutable_data<int64_t>(), x_size, max_len_);
82+
break;
83+
}
84+
default:
85+
LOG(FATAL) << "unsupported out data type: " << out_type_;
86+
break;
87+
}
88+
}
89+
90+
void PrepareOpDesc(cpp::OpDesc* op_desc) {
91+
op_desc->SetType("sequence_mask");
92+
op_desc->SetInput("X", {x_});
93+
if (!max_len_tensor_.empty()) {
94+
op_desc->SetInput("MaxLenTensor", {max_len_tensor_});
95+
op_desc->SetAttr("maxlen", -1);
96+
} else {
97+
op_desc->SetAttr("maxlen", max_len_);
98+
}
99+
op_desc->SetOutput("Y", {y_});
100+
op_desc->SetAttr("out_dtype", out_type_);
101+
}
102+
103+
void PrepareData() override {
104+
std::vector<T> x_data(x_dims_.production());
105+
fill_data_rand<T>(x_data.data(), 0, 4, x_dims_.production());
106+
SetCommonTensor(x_, x_dims_, x_data.data());
107+
108+
if (!max_len_tensor_.empty()) {
109+
std::vector<int> max_len_tensor_data{max_len_};
110+
SetCommonTensor(max_len_tensor_, DDim{{1}}, max_len_tensor_data.data());
111+
}
112+
}
113+
};
114+
115+
template <class T>
116+
void TestSequenceMaskHelper(const Place place,
117+
const float abs_error,
118+
const int max_len = 5,
119+
const int out_type = 5,
120+
const bool use_max_len_tensor = false) {
121+
std::string alias;
122+
auto precision = lite_api::PrecisionTypeTrait<T>::Type();
123+
switch (precision) {
124+
case PRECISION(kFloat):
125+
alias = std::string("def");
126+
break;
127+
case PRECISION(kInt32):
128+
alias = std::string("int32");
129+
break;
130+
case PRECISION(kInt64):
131+
alias = std::string("int64");
132+
break;
133+
default:
134+
LOG(FATAL) << "unsupported input data type: "
135+
<< lite_api::PrecisionToStr(precision);
136+
break;
137+
}
138+
std::unique_ptr<arena::TestCase> tester(new SequenceMaskTester<T>(
139+
place, alias, max_len, out_type, use_max_len_tensor));
140+
arena::Arena arena(std::move(tester), place, abs_error);
141+
arena.TestPrecision();
142+
}
143+
144+
template <class T>
145+
void TestSequenceMask(const Place place, const float abs_error) {
146+
// test max_len
147+
for (int max_len : {6}) {
148+
TestSequenceMaskHelper<T>(place, abs_error, max_len);
149+
}
150+
// test out_type
151+
for (int out_type : {2, 3, 5}) {
152+
TestSequenceMaskHelper<T>(place, abs_error, 5, out_type);
153+
}
154+
// test max_len_tensor
155+
TestSequenceMaskHelper<T>(place, abs_error, 5, 5, true);
156+
}
157+
158+
// Entry point: runs the sweep for every supported input element type on
// the host kernel; skipped on targets without a host build.
TEST(sequence_mask, precision) {
  Place place;
  float abs_error = 1e-5;
#if defined(LITE_WITH_ARM) || defined(LITE_WITH_X86)
  place = TARGET(kHost);
#else
  return;
#endif

  TestSequenceMask<float>(place, abs_error);
  TestSequenceMask<int>(place, abs_error);
  TestSequenceMask<int64_t>(place, abs_error);
}
171+
172+
} // namespace lite
173+
} // namespace paddle

0 commit comments

Comments
 (0)