// Copyright (c) 2019 PaddlePaddle Authors. All Rights Reserved. // // Licensed under the Apache License, Version 2.0 (the "License"); // you may not use this file except in compliance with the License. // You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, software // distributed under the License is distributed on an "AS IS" BASIS, // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. // See the License for the specific language governing permissions and // limitations under the License. #include "paddle/fluid/lite/kernels/arm/softmax_compute.h" #include "paddle/fluid/lite/arm/math/funcs.h" namespace paddle { namespace lite { namespace kernels { namespace arm { void SoftmaxCompute::Run() { auto& param = Param(); const float* din = param.x->data(); float* dout = param.output->mutable_data(); auto dim_x = param.x->dims(); auto rank_x = dim_x.size(); int axis = param.axis; if (axis < 0) { axis += rank_x; } int outer_num = dim_x.Slice(0, axis).production(); int inner_num = dim_x.Slice(axis + 1, rank_x).production(); int axis_size = dim_x[axis]; if (inner_num == 1) { if (axis_size >= 4) { lite::arm::math::softmax_inner1_large_axis(din, dout, outer_num, axis_size); } else { lite::arm::math::softmax_inner1_small_axis(din, dout, outer_num, axis_size); } } else { int compute_size = outer_num * inner_num; if (axis_size == 4 && inner_num % 8 == 0) { lite::arm::math::softmax_inner8_axis4(din, dout, axis_size, inner_num, outer_num); } else if (axis_size == 4 && inner_num % 4 == 0) { lite::arm::math::softmax_inner4_axis4(din, dout, axis_size, inner_num, outer_num); } else { if (inner_num % 8 == 0) { lite::arm::math::softmax_inner8(din, dout, axis_size, inner_num, outer_num); } else if (inner_num % 4 == 0) { lite::arm::math::softmax_inner4(din, dout, axis_size, inner_num, outer_num); } else { lite::arm::math::softmax_basic(din, dout, axis_size, inner_num, outer_num); } } } } TargetType SoftmaxCompute::target() const { return TARGET(kARM); } PrecisionType SoftmaxCompute::precision() const { return PRECISION(kFloat); } } // namespace arm } // namespace kernels } // namespace lite } // namespace paddle REGISTER_LITE_KERNEL(softmax, kARM, kFloat, kNCHW, paddle::lite::kernels::arm::SoftmaxCompute, def) .BindInput("X", {LiteType::GetTensorTy(TARGET(kARM))}) .BindOutput("Out", {LiteType::GetTensorTy(TARGET(kARM))}) .Finalize();