// Copyright (c) 2019 PaddlePaddle Authors. All Rights Reserved. // // Licensed under the Apache License, Version 2.0 (the "License"); // you may not use this file except in compliance with the License. // You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, software // distributed under the License is distributed on an "AS IS" BASIS, // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. // See the License for the specific language governing permissions and // limitations under the License. #include "lite/kernels/arm/softmax_compute.h" #include "lite/backends/arm/math/funcs.h" namespace paddle { namespace lite { namespace kernels { namespace arm { void SoftmaxCompute::Run() { auto& param = Param(); const float* din = param.x->data(); float* dout = param.output->mutable_data(); auto x_dims = param.x->dims(); auto x_rank = x_dims.size(); int axis = param.axis; if (axis < 0) { axis += x_rank; } int outer_num = x_dims.Slice(0, axis).production(); int inner_num = x_dims.Slice(axis + 1, x_rank).production(); int axis_size = x_dims[axis]; if (inner_num == 1) { if (axis_size > 4) { lite::arm::math::softmax_inner1_large_axis( din, dout, outer_num, axis_size); } else { lite::arm::math::softmax_inner1_small_axis( din, dout, outer_num, axis_size); } } else { int compute_size = outer_num * inner_num; if (axis_size == 4 && inner_num % 8 == 0) { lite::arm::math::softmax_inner8_axis4( din, dout, axis_size, inner_num, outer_num); } else if (axis_size == 4 && inner_num % 4 == 0) { lite::arm::math::softmax_inner4_axis4( din, dout, axis_size, inner_num, outer_num); } else { if (inner_num % 8 == 0) { lite::arm::math::softmax_inner8( din, dout, axis_size, inner_num, outer_num); } else if (inner_num % 4 == 0) { lite::arm::math::softmax_inner4( din, dout, axis_size, inner_num, outer_num); } else { lite::arm::math::softmax_basic( din, dout, axis_size, inner_num, outer_num); } } } } } // namespace arm } // namespace kernels } // namespace lite } // namespace paddle REGISTER_LITE_KERNEL(softmax, kARM, kFloat, kNCHW, paddle::lite::kernels::arm::SoftmaxCompute, def) .BindInput("X", {LiteType::GetTensorTy(TARGET(kARM))}) .BindOutput("Out", {LiteType::GetTensorTy(TARGET(kARM))}) .Finalize();