// Copyright (c) 2019 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#include "lite/kernels/npu/bridges/graph.h"
#include "lite/kernels/npu/bridges/registry.h"
#include "lite/kernels/npu/bridges/utility.h"

namespace paddle {
namespace lite {
namespace subgraph {
namespace npu {

std::vector<int64_t> CvtYShape(const DDim& x_dims,
                               const DDim& y_dims,
                               int axis) {
27
  CHECK_EQ(x_dims.size(), 4UL) << "[NPU] Only support 4-dimension x";
28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47
  CHECK_GE(x_dims.size(), y_dims.size());

  if (axis < 0) {
    axis += x_dims.size();
  }

  std::vector<int64_t> y_new_shape(y_dims.Vectorize());
  if (y_new_shape.size() == 4UL) {
    return y_new_shape;
  }
  for (int i = 0; i < axis; i++) {
    y_new_shape.insert(y_new_shape.begin(), 1);
  }
  while (y_new_shape.size() < 4) {
    y_new_shape.push_back(1);
  }
  CHECK_EQ(y_new_shape.size(), 4UL);
  return y_new_shape;
}

int ElementwiseConverter(void* ctx, OpLite* op, KernelBase* kernel) {
49 50 51 52
  CHECK(ctx != nullptr);
  CHECK(op != nullptr);
  auto graph = static_cast<Graph*>(ctx);
  auto op_info = op->op_info();
53
  auto op_type = op_info->Type();
54 55
  auto scope = op->scope();
  VLOG(3) << "[NPU] Converting " + op_type + "...";
56

57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73
  // Get input and output vars and op attributes
  auto x_name = op_info->Input("X").front();
  auto x_type = kernel->GetInputDeclType("X");
  CHECK(x_type->precision() == PRECISION(kFloat));
  CHECK(x_type->layout() == DATALAYOUT(kNCHW));
  auto x = scope->FindMutableTensor(x_name);
  auto x_dims = x->dims();
  auto y_name = op_info->Input("Y").front();
  auto y_type = kernel->GetInputDeclType("Y");
  CHECK(y_type->precision() == PRECISION(kFloat));
  CHECK(y_type->layout() == DATALAYOUT(kNCHW));
  auto y = scope->FindMutableTensor(y_name);
  auto y_dims = y->dims();
  auto out_name = op_info->Output("Out").front();
  auto out_type = kernel->GetOutputDeclType("Out");
  CHECK(out_type->precision() == PRECISION(kFloat));
  CHECK(out_type->layout() == DATALAYOUT(kNCHW));
74
  auto axis = op_info->GetAttr<int>("axis");
Y
Yan Chunwei 已提交
75

76
  // X node
77 78 79
  std::shared_ptr<Node> x_node = nullptr;
  if (graph->Has(x_name)) {
    x_node = graph->Get(x_name);
80
  } else {
81
    x_node = graph->Add(x_name, *x);
82 83 84
  }

  // Y node
85 86 87
  std::shared_ptr<Node> y_node = nullptr;
  if (graph->Has(y_name)) {
    y_node = graph->Get(y_name);
Y
Yan Chunwei 已提交
88
  } else {
89
    auto y_new_shape = CvtYShape(x_dims, y_dims, axis);
90
    y_node = graph->Add(y_name, *y, y_new_shape);
Y
Yan Chunwei 已提交
91 92
  }

93
  // Elementwise node
94
  std::shared_ptr<Node> elt_node = nullptr;
95 96
  if (op_type == "elementwise_add" ||
      op_type == "fusion_elementwise_add_activation") {
97 98 99 100
    elt_node = graph->Add<ge::op::Add>(out_name);
    auto elt_op = elt_node->data<ge::op::Add>();
    elt_op->set_input_x1(*x_node->data());
    elt_op->set_input_x2(*y_node->data());
101
  } else if (op_type == "elementwise_sub") {
102 103 104 105
    elt_node = graph->Add<ge::op::Sub>(out_name);
    auto elt_op = elt_node->data<ge::op::Sub>();
    elt_op->set_input_x1(*x_node->data());
    elt_op->set_input_x2(*y_node->data());
106
  } else if (op_type == "elementwise_mul") {
107 108 109 110
    elt_node = graph->Add<ge::op::Mul>(out_name);
    auto elt_op = elt_node->data<ge::op::Mul>();
    elt_op->set_input_x(*x_node->data());
    elt_op->set_input_y(*y_node->data());
111
  } else if (op_type == "elementwise_div") {
112 113 114 115
    elt_node = graph->Add<ge::op::RealDiv>(out_name);
    auto elt_op = elt_node->data<ge::op::RealDiv>();
    elt_op->set_input_x1(*x_node->data());
    elt_op->set_input_x2(*y_node->data());
116
  } else {
117 118
    LOG(WARNING) << "[NPU] Unsupported op type: " << op_type;
    return FAILED;
119
  }
Y
Yan Chunwei 已提交
120

121
  // Act node
122 123
  if (op_type == "fusion_elementwise_add_activation") {
    auto act_type = op_info->GetAttr<std::string>("act_type");
124 125 126
    auto act_node = graph->Add<ge::op::Activation>(out_name);
    auto act_op = act_node->data<ge::op::Activation>();
    act_op->set_input_x(*elt_node->data());
127 128
    // TODO(hong19860320) set the coef value for act Ops, such as leaky_relu,
    // clipped_relu etc.
129
    act_op->set_attr_mode(CvtActMode(act_type));
130
  }
131
  return REBUILD_WHEN_SHAPE_CHANGED;
Y
Yan Chunwei 已提交
132 133 134
}

}  // namespace npu
}  // namespace subgraph
}  // namespace lite
}  // namespace paddle

// Register ElementwiseConverter as the kNPU subgraph bridge for every op type
// it handles.
REGISTER_SUBGRAPH_BRIDGE(elementwise_add,
                         kNPU,
                         paddle::lite::subgraph::npu::ElementwiseConverter);
REGISTER_SUBGRAPH_BRIDGE(fusion_elementwise_add_activation,
                         kNPU,
                         paddle::lite::subgraph::npu::ElementwiseConverter);
REGISTER_SUBGRAPH_BRIDGE(elementwise_sub,
                         kNPU,
                         paddle::lite::subgraph::npu::ElementwiseConverter);
REGISTER_SUBGRAPH_BRIDGE(elementwise_mul,
                         kNPU,
                         paddle::lite::subgraph::npu::ElementwiseConverter);
REGISTER_SUBGRAPH_BRIDGE(elementwise_div,
                         kNPU,
                         paddle::lite::subgraph::npu::ElementwiseConverter);