// Copyright (c) 2019 PaddlePaddle Authors. All Rights Reserved. // // Licensed under the Apache License, Version 2.0 (the "License"); // you may not use this file except in compliance with the License. // You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, software // distributed under the License is distributed on an "AS IS" BASIS, // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. // See the License for the specific language governing permissions and // limitations under the License. #include "lite/backends/npu/builder.h" #include "lite/kernels/npu/bridges/registry.h" namespace paddle { namespace lite { namespace kernels { namespace npu { namespace bridges { std::vector CvtYShape(const Tensor& x, Tensor* y, int axis) { auto x_dims = x.dims(); CHECK_EQ(x_dims.size(), 4UL) << "[NPU] only support 4-dimension x"; auto y_dims = y->dims(); CHECK_GE(x_dims.size(), y_dims.size()); if (axis < 0) { axis += x_dims.size(); } std::vector y_new_shape(y_dims.Vectorize()); if (y_new_shape.size() == 4UL) { return y_new_shape; } for (int i = 0; i < axis; i++) { y_new_shape.insert(y_new_shape.begin(), 1); } while (y_new_shape.size() < 4) { y_new_shape.push_back(1); } CHECK_EQ(y_new_shape.size(), 4UL); return y_new_shape; } node_map_type ElementwiseConverter( const std::shared_ptr elementwise_op, const node_map_type& inputs_map) { auto scope = elementwise_op->scope(); auto op_info = elementwise_op->op_info(); auto op_type = op_info->Type(); auto unique_op_type = lite::npu::UniqueName(op_type); LOG(INFO) << "[NPU] Converting " + op_type + "..."; auto x_var_name = op_info->Input("X").front(); auto y_var_name = op_info->Input("Y").front(); CHECK(inputs_map.find(x_var_name) != inputs_map.end()); auto axis = op_info->GetAttr("axis"); std::shared_ptr elementwise_node = nullptr; std::shared_ptr x_node = inputs_map.at(x_var_name); std::shared_ptr y_node = nullptr; if (inputs_map.find(y_var_name) != inputs_map.end()) { y_node = inputs_map.at(y_var_name); } else { auto y_const_node = std::make_shared(y_var_name); auto x = scope->FindTensor(x_var_name); auto y = scope->FindMutableTensor(y_var_name); auto y_new_shape = CvtYShape(*x, y, axis); y_const_node->set_attr_value(lite::npu::CvtTensor(y, y_new_shape)); y_node = y_const_node; } lite::npu::OpList::Global().add(x_node); lite::npu::OpList::Global().add(y_node); if (op_type == "elementwise_add" || op_type == "fusion_elementwise_add_activation") { auto elt_node = std::make_shared(unique_op_type); elt_node->set_input_x1(*x_node); elt_node->set_input_x2(*y_node); elementwise_node = elt_node; } else if (op_type == "elementwise_sub") { auto elt_node = std::make_shared(unique_op_type); elt_node->set_input_x1(*x_node); elt_node->set_input_x2(*y_node); elementwise_node = elt_node; } else if (op_type == "elementwise_mul") { auto elt_node = std::make_shared(unique_op_type); elt_node->set_input_x(*x_node); elt_node->set_input_y(*y_node); elementwise_node = elt_node; } else if (op_type == "elementwise_div") { auto elt_node = std::make_shared(unique_op_type); elt_node->set_input_x1(*x_node); elt_node->set_input_x2(*y_node); elementwise_node = elt_node; } else { LOG(FATAL) << "unsupported op type: " << op_type; } lite::npu::OpList::Global().add(elementwise_node); node_map_type outputs_map; if (op_type == "fusion_elementwise_add_activation") { auto act_type = op_info->GetAttr("act_type"); auto act_node = std::make_shared(unique_op_type + "/act"); act_node->set_input_x(*elementwise_node); // TODO(hong19860320) set the coef value for act Ops, such as leaky_relu, // clipped_relu etc. act_node->set_attr_mode(lite::npu::CvtActMode(act_type)); lite::npu::OpList::Global().add(act_node); outputs_map[op_info->Output("Out").front()] = act_node; } else { outputs_map[op_info->Output("Out").front()] = elementwise_node; } return outputs_map; } } // namespace bridges } // namespace npu } // namespace kernels } // namespace lite } // namespace paddle REGISTER_NPU_BRIDGE(elementwise_add, paddle::lite::kernels::npu::bridges::ElementwiseConverter); REGISTER_NPU_BRIDGE(fusion_elementwise_add_activation, paddle::lite::kernels::npu::bridges::ElementwiseConverter); REGISTER_NPU_BRIDGE(elementwise_sub, paddle::lite::kernels::npu::bridges::ElementwiseConverter); REGISTER_NPU_BRIDGE(elementwise_mul, paddle::lite::kernels::npu::bridges::ElementwiseConverter); REGISTER_NPU_BRIDGE(elementwise_div, paddle::lite::kernels::npu::bridges::ElementwiseConverter);