// Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved. // // Licensed under the Apache License, Version 2.0 (the "License"); // you may not use this file except in compliance with the License. // You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, software // distributed under the License is distributed on an "AS IS" BASIS, // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. // See the License for the specific language governing permissions and // limitations under the License. #include "paddle/fluid/inference/anakin/convert/sum.h" #include #include #include using anakin::PTuple; namespace paddle { namespace inference { namespace anakin { template void SumOpConverter::operator()( const framework::proto::OpDesc &op, const framework::BlockDesc &block_desc, const framework::Scope &scope, bool test_mode) { framework::OpDesc op_desc(op, nullptr); PADDLE_ENFORCE_EQ(op_desc.Input("X").size(), 2); PADDLE_ENFORCE_EQ(op_desc.Output("Out").size(), 1); auto input_names = op_desc.Input("X"); auto out_name = op_desc.Output("Out").front(); auto op_name = op_desc.Type() + ":" + op_desc.Output("Out").front(); std::vector coeff = {1, 1}; std::string elementwise_type = "Add"; this->engine_->AddOp(op_name, "Eltwise", input_names, {out_name}); this->engine_->template AddOpAttr>(op_name, "coeff", coeff); this->engine_->template AddOpAttr(op_name, "type", elementwise_type); } } // namespace anakin } // namespace inference } // namespace paddle #ifdef PADDLE_WITH_CUDA using sum_nv_fp32 = ::paddle::inference::anakin::SumOpConverter<::anakin::saber::NV, ::anakin::Precision::FP32>; using sum_nv_int8 = ::paddle::inference::anakin::SumOpConverter<::anakin::saber::NV, ::anakin::Precision::INT8>; REGISTER_CUDA_ANAKIN_OP_CONVERTER(sum, sum_nv_fp32); REGISTER_CUDA_INT8_ANAKIN_OP_CONVERTER(sum, sum_nv_int8); #endif using sum_cpu_fp32 = ::paddle::inference::anakin::SumOpConverter<::anakin::saber::X86, ::anakin::Precision::FP32>; using sum_cpu_int8 = ::paddle::inference::anakin::SumOpConverter<::anakin::saber::X86, ::anakin::Precision::INT8>; REGISTER_CPU_ANAKIN_OP_CONVERTER(sum, sum_cpu_fp32); REGISTER_CPU_INT8_ANAKIN_OP_CONVERTER(sum, sum_cpu_int8);