Skip to content

Commit 8b20ca3

Browse files
authored
[GCU] Add custom_engine ppocr_cls testcase (#1616)
1 parent f15d7d1 commit 8b20ca3

File tree

6 files changed

+490
-0
lines changed

6 files changed

+490
-0
lines changed

backends/gcu/custom_engine/ir_translator/operators/reshape.cc

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -38,3 +38,4 @@ static GcuOpPtr TranslateReshape(
3838
} // namespace custom_engine
3939

4040
REGISTER_OP_TRANSLATOR(pd_op_reshape, custom_engine::TranslateReshape)
41+
REGISTER_OP_TRANSLATOR(pd_op_reshape_, custom_engine::TranslateReshape)
Lines changed: 34 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,34 @@
1+
// Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved.
2+
//
3+
// Licensed under the Apache License, Version 2.0 (the "License");
4+
// you may not use this file except in compliance with the License.
5+
// You may obtain a copy of the License at
6+
//
7+
// http://www.apache.org/licenses/LICENSE-2.0
8+
//
9+
// Unless required by applicable law or agreed to in writing, software
10+
// distributed under the License is distributed on an "AS IS" BASIS,
11+
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12+
// See the License for the specific language governing permissions and
13+
// limitations under the License.
14+
15+
#include <vector>
16+
17+
#include "custom_engine/ir_translator/translator_registry.h"
18+
19+
namespace custom_engine {
20+
21+
// Translates a pd_op.shape operation into GCU builder ops: queries the
// shape of the sole input tensor and converts the result to S32
// (presumably to match the int32 output dtype of Paddle's shape op —
// confirm against the op definition).
static GcuOpPtr TranslateShape(
    GcuBuilderPtr gcu_builder,
    const pir::Operation *op,
    const std::vector<std::vector<GcuOpPtr>> &gcu_op_inputs) {
  auto input = *(gcu_op_inputs[0][0]);
  auto shape_op = builder::Shape(input);
  // Cast the shape result down to S32, keeping its own shape unchanged.
  auto shape_s32 = builder::Convert(
      shape_op, {shape_op.GetType().GetShape(), builder::PrimitiveType::S32()});
  return std::make_shared<GcuOp>(shape_s32);
}
31+
32+
} // namespace custom_engine
33+
34+
REGISTER_OP_TRANSLATOR(pd_op_shape, custom_engine::TranslateShape)
Lines changed: 128 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,128 @@
1+
// Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved.
2+
//
3+
// Licensed under the Apache License, Version 2.0 (the "License");
4+
// you may not use this file except in compliance with the License.
5+
// You may obtain a copy of the License at
6+
//
7+
// http://www.apache.org/licenses/LICENSE-2.0
8+
//
9+
// Unless required by applicable law or agreed to in writing, software
10+
// distributed under the License is distributed on an "AS IS" BASIS,
11+
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12+
// See the License for the specific language governing permissions and
13+
// limitations under the License.
14+
15+
#include <vector>
16+
17+
#include "custom_engine/ir_translator/translator_registry.h"
18+
19+
namespace custom_engine {
20+
21+
static GcuOpPtr TranslateSlice(
22+
GcuBuilderPtr gcu_builder,
23+
const pir::Operation *op,
24+
const std::vector<std::vector<GcuOpPtr>> &gcu_op_inputs) {
25+
// Get attributes
26+
const auto &attributes = op->attributes();
27+
auto axes_list =
28+
attributes.at("axes").dyn_cast<pir::ArrayAttribute>().AsVector();
29+
std::vector<int64_t> axes;
30+
if (axes_list.size() > 0) {
31+
PADDLE_ENFORCE_EQ(axes_list[0].isa<pir::Int64Attribute>(),
32+
true,
33+
common::errors::Unimplemented(
34+
"the 0th axes MUST be pir::Int64Attribute"));
35+
for (size_t i = 0; i < axes_list.size(); ++i) {
36+
axes.push_back(axes_list[i].dyn_cast<pir::Int64Attribute>().data());
37+
}
38+
}
39+
40+
auto infer_flags_list =
41+
attributes.at("infer_flags").dyn_cast<pir::ArrayAttribute>().AsVector();
42+
std::vector<int64_t> infer_flags;
43+
if (infer_flags_list.size() > 0) {
44+
PADDLE_ENFORCE_EQ(infer_flags_list[0].isa<pir::Int64Attribute>(),
45+
true,
46+
common::errors::Unimplemented(
47+
"the 0th infer_flags MUST be pir::Int64Attribute"));
48+
for (size_t i = 0; i < infer_flags_list.size(); ++i) {
49+
infer_flags.push_back(
50+
infer_flags_list[i].dyn_cast<pir::Int64Attribute>().data());
51+
}
52+
}
53+
54+
auto decrease_axis_list =
55+
attributes.at("decrease_axis").dyn_cast<pir::ArrayAttribute>().AsVector();
56+
std::vector<int64_t> decrease_axis;
57+
if (decrease_axis_list.size() > 0) {
58+
PADDLE_ENFORCE_EQ(decrease_axis_list[0].isa<pir::Int64Attribute>(),
59+
true,
60+
common::errors::Unimplemented(
61+
"the 0th decrease_axis MUST be pir::Int64Attribute"));
62+
for (size_t i = 0; i < decrease_axis_list.size(); ++i) {
63+
decrease_axis.push_back(
64+
decrease_axis_list[i].dyn_cast<pir::Int64Attribute>().data());
65+
}
66+
}
67+
68+
auto input = *(gcu_op_inputs[0][0]);
69+
70+
auto starts_tensor = *(gcu_op_inputs[1][0]);
71+
PADDLE_ENFORCE_EQ(starts_tensor.IsConstant(),
72+
true,
73+
common::errors::PreconditionNotMet(
74+
"Input[1] starts_tensor is not a Constant."));
75+
auto starts = starts_tensor.GetConstData<int64_t>();
76+
77+
auto ends_tensor = *(gcu_op_inputs[2][0]);
78+
PADDLE_ENFORCE_EQ(ends_tensor.IsConstant(),
79+
true,
80+
common::errors::PreconditionNotMet(
81+
"Input[1] ends_tensor is not a Constant."));
82+
auto ends = ends_tensor.GetConstData<int64_t>();
83+
84+
auto rank = input.GetType().GetRank();
85+
const std::vector<int64_t> &input_shapes = input.GetType().GetShape();
86+
std::vector<int64_t> start_indices(rank, 0);
87+
std::vector<int64_t> limit_indices = input_shapes;
88+
for (size_t i = 0; i < axes.size(); ++i) {
89+
int dim = axes[i];
90+
if (dim < 0) {
91+
dim += rank;
92+
}
93+
start_indices[dim] =
94+
starts[i] < 0 ? starts[i] + input_shapes[dim] : starts[i];
95+
start_indices[dim] = std::max(start_indices[dim], 0L);
96+
start_indices[dim] = std::min(start_indices[dim], input_shapes[dim]);
97+
98+
limit_indices[dim] = ends[i] < 0 ? ends[i] + input_shapes[dim] : ends[i];
99+
limit_indices[dim] = std::min(limit_indices[dim], input_shapes[dim]);
100+
limit_indices[dim] = std::max(limit_indices[dim], 0L);
101+
}
102+
std::vector<int64_t> strides(rank, 1);
103+
104+
auto slice = builder::Slice(input, start_indices, limit_indices, strides);
105+
106+
if (decrease_axis.size() == 0) {
107+
return std::make_shared<GcuOp>(slice);
108+
} else {
109+
auto slice_shape = slice.GetType().GetShape();
110+
std::vector<int64_t> new_shape;
111+
size_t iter = 0;
112+
for (int64_t i = 0; i < static_cast<int64_t>(slice_shape.size()); ++i) {
113+
if (iter < decrease_axis.size() && i == decrease_axis[iter]) {
114+
++iter;
115+
} else {
116+
new_shape.emplace_back(slice_shape[i]);
117+
}
118+
}
119+
if (new_shape.empty()) {
120+
new_shape.emplace_back(1);
121+
}
122+
return std::make_shared<GcuOp>(builder::Reshape(slice, new_shape));
123+
}
124+
}
125+
126+
} // namespace custom_engine
127+
128+
REGISTER_OP_TRANSLATOR(pd_op_slice, custom_engine::TranslateSlice)
Lines changed: 67 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,67 @@
1+
// Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved.
2+
//
3+
// Licensed under the Apache License, Version 2.0 (the "License");
4+
// you may not use this file except in compliance with the License.
5+
// You may obtain a copy of the License at
6+
//
7+
// http://www.apache.org/licenses/LICENSE-2.0
8+
//
9+
// Unless required by applicable law or agreed to in writing, software
10+
// distributed under the License is distributed on an "AS IS" BASIS,
11+
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12+
// See the License for the specific language governing permissions and
13+
// limitations under the License.
14+
15+
#include <vector>
16+
17+
#include "custom_engine/ir_translator/translator_registry.h"
18+
19+
namespace custom_engine {
20+
21+
// Translates pd_op.softmax into GCU builder ops: runs builder::Softmax
// along `axis`, then clamps the result into dtype-specific [min, max]
// bounds so outputs never reach exact zero.
static GcuOpPtr TranslateSoftmax(
    GcuBuilderPtr gcu_builder,
    const pir::Operation* op,
    const std::vector<std::vector<GcuOpPtr>>& gcu_op_inputs) {
  auto input = *(gcu_op_inputs[0][0]);

  // Get attributes
  // `axis` is stored as an Int32Attribute on the op; widen to int64_t
  // for the builder call.
  const auto& attributes = op->attributes();
  int64_t axis = static_cast<int64_t>(
      attributes.at("axis").dyn_cast<pir::Int32Attribute>().data());

  // Reject anything other than F32/F64 up front.
  if (!(input.GetType().GetPrimitiveType() == builder::PrimitiveType::F32()) &&
      !(input.GetType().GetPrimitiveType() == builder::PrimitiveType::F64())) {
    PADDLE_THROW(phi::errors::Unimplemented(
        "GCU softmax only support FP32/FP64 datatype so far as now!"));
  }

  // to avoid 0
  // Dtype-specific clamp bounds. max_ptr/min_ptr alias whichever pair of
  // stack locals matches the input's primitive type; they must stay alive
  // until the builder::Const calls below consume them.
  double max_value_d = 1.0;
  double min_value_d = 1e-16;
  float max_value_f = 1.0;
  float min_value_f = 1e-7;
  void* max_ptr = nullptr;
  void* min_ptr = nullptr;
  auto scalar_type = builder::Type(input.GetType().GetPrimitiveType());
  if (input.GetType().GetPrimitiveType() == builder::PrimitiveType::F32()) {
    max_ptr = static_cast<void*>(&max_value_f);
    min_ptr = static_cast<void*>(&min_value_f);
  } else if (input.GetType().GetPrimitiveType() ==
             builder::PrimitiveType::F64()) {
    max_ptr = static_cast<void*>(&max_value_d);
    min_ptr = static_cast<void*>(&min_value_d);
  } else {
    // Unreachable: the F32/F64 check above already rejected other dtypes;
    // kept as a defensive guard.
    PADDLE_THROW(phi::errors::InvalidArgument("Unsupported datatype"));
  }

  // Materialize the bounds as scalar constants and clamp the softmax
  // output. NOTE(review): the argument order builder::Clamp(min, value,
  // max) and the Softmax flags (true, false, 0.0) are assumed from this
  // call site — confirm against the GCU builder API.
  auto max_op = builder::Const(gcu_builder, max_ptr, scalar_type);
  auto min_op = builder::Const(gcu_builder, min_ptr, scalar_type);
  auto softmax = builder::Softmax(input, axis, true, false, 0.0);
  auto res = builder::Clamp(min_op, softmax, max_op);
  return std::make_shared<GcuOp>(res);
}
63+
64+
} // namespace custom_engine
65+
66+
REGISTER_OP_TRANSLATOR(pd_op_softmax, custom_engine::TranslateSoftmax)
67+
REGISTER_OP_TRANSLATOR(pd_op_softmax_, custom_engine::TranslateSoftmax)

backends/gcu/passes/gcu_op_marker_pass.cc

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -80,7 +80,10 @@ DEFINE_GENERAL_PATTERN(Pool2d, paddle::dialect::Pool2dOp)
8080
DEFINE_GENERAL_PATTERN(Relu, paddle::dialect::ReluOp)
8181
DEFINE_GENERAL_PATTERN(Relu_, paddle::dialect::Relu_Op)
8282
DEFINE_GENERAL_PATTERN(Reshape, paddle::dialect::ReshapeOp)
83+
DEFINE_GENERAL_PATTERN(Shape, paddle::dialect::ShapeOp)
8384
DEFINE_GENERAL_PATTERN(Sigmoid, paddle::dialect::SigmoidOp)
85+
DEFINE_GENERAL_PATTERN(Slice, paddle::dialect::SliceOp)
86+
DEFINE_GENERAL_PATTERN(Softmax, paddle::dialect::SoftmaxOp)
8487
DEFINE_GENERAL_PATTERN(Sqrt, paddle::dialect::SqrtOp)
8588
DEFINE_GENERAL_PATTERN(Where, paddle::dialect::WhereOp)
8689

@@ -127,7 +130,10 @@ class GcuOpMarkerPass : public pir::PatternRewritePass {
127130
ADD_PATTERN(Relu)
128131
ADD_PATTERN(Relu_)
129132
ADD_PATTERN(Reshape)
133+
// ADD_PATTERN(Shape)
130134
ADD_PATTERN(Sigmoid)
135+
// ADD_PATTERN(Slice)
136+
ADD_PATTERN(Softmax)
131137
ADD_PATTERN(Sqrt)
132138
ADD_PATTERN(Where)
133139

0 commit comments

Comments
 (0)