diff --git a/src/common/types.cpp b/src/common/types.cpp index 444789237f573f8da3eaf915abf61493967aabf8..cd5e66517f159f5f9db118313b78ccd2a8c216a8 100644 --- a/src/common/types.cpp +++ b/src/common/types.cpp @@ -73,6 +73,9 @@ const char *G_OP_TYPE_SHAPE = "shape"; const char *G_OP_TYPE_SUM = "sum"; const char *G_OP_TYPE_TOP_K = "top_k"; const char *G_OP_TYPE_CAST = "cast"; +const char *G_OP_TYPE_LOG = "log"; +const char *G_OP_TYPE_LOD_RESET = "lod_reset"; +const char *G_OP_TYPE_LESS_THAN = "less_than"; const char *G_OP_TYPE_QUANTIZE = "quantize"; const char *G_OP_TYPE_DEQUANTIZE = "dequantize"; @@ -171,5 +174,8 @@ std::unordered_map< {G_OP_TYPE_SEQUENCE_EXPAND, {{"X", "Y"}, {"Out"}}}, {G_OP_TYPE_SEQUENCE_POOL, {{"X"}, {"Out"}}}, {G_OP_TYPE_SEQUENCE_SOFTMAX, {{"X"}, {"Out"}}}, - {G_OP_TYPE_NORM, {{"X"}, {"Out", "Norm"}}}}; + {G_OP_TYPE_NORM, {{"X"}, {"Out", "Norm"}}}, + {G_OP_TYPE_LOG, {{"X"}, {"Out"}}}, + {G_OP_TYPE_LOD_RESET, {{"X", "Y"}, {"Out"}}}, + {G_OP_TYPE_LESS_THAN, {{"X", "Y"}, {"Out"}}}}; } // namespace paddle_mobile diff --git a/src/common/types.h b/src/common/types.h index 114424fe04add874affb42fe9fca8f0d86bcdd82..9719be623cf7d92147416de1b5ebf276c866edcd 100644 --- a/src/common/types.h +++ b/src/common/types.h @@ -100,6 +100,7 @@ enum ActivationType { LEAKY_RELU = 4, TANH = 5, SIGMOID = 6, + LOG = 7, }; enum PoolingType { @@ -155,6 +156,9 @@ extern const char *G_OP_TYPE_PRELU; extern const char *G_OP_TYPE_SUM; extern const char *G_OP_TYPE_TOP_K; extern const char *G_OP_TYPE_CAST; +extern const char *G_OP_TYPE_LOG; +extern const char *G_OP_TYPE_LOD_RESET; +extern const char *G_OP_TYPE_LESS_THAN; extern const char *G_OP_TYPE_QUANTIZE; extern const char *G_OP_TYPE_DEQUANTIZE; diff --git a/src/framework/load_ops.h b/src/framework/load_ops.h index 88fb360fcc4a135d39fee1e117ba1279d66acae5..1caefe5ae77c9f4328d4d99af9e0b5c3b408d921 100644 --- a/src/framework/load_ops.h +++ b/src/framework/load_ops.h @@ -270,3 +270,12 @@ LOAD_OP1(sequence_expand, CPU); #ifdef SEQUENCE_POOL_OP LOAD_OP1(sequence_pool, CPU); #endif +#ifdef LOG_OP +LOAD_OP1(log, CPU); +#endif +#ifdef LOD_RESET_OP +LOAD_OP1(lod_reset, CPU); +#endif +#ifdef LESS_THAN_OP +LOAD_OP1(less_than, CPU); +#endif diff --git a/src/framework/operator.h b/src/framework/operator.h index 464910b613322451d05adcc772825079d0d8f677..deb573571f8ca0184da0714de54ee98655e78921 100644 --- a/src/framework/operator.h +++ b/src/framework/operator.h @@ -36,13 +36,12 @@ limitations under the License. */ #include "framework/cl/cl_helper.h" #include "framework/cl/cl_scope.h" #endif + namespace paddle_mobile { namespace framework { -using std::string; -using std::vector; template -static T *GetVarValue(const string &key, const VariableNameMap &var_map, +static T *GetVarValue(const std::string &key, const VariableNameMap &var_map, const Scope &scope) { auto var_vec = var_map.at(key); if (!var_vec.empty()) { @@ -56,44 +55,29 @@ static T *GetVarValue(const string &key, const VariableNameMap &var_map, template class OperatorBase { public: - /* - * @b op 基类的实例化方法, op 获取到了 输入、参数以及提前分配好的输出 tensor - * */ OperatorBase(const std::string &type, const VariableNameMap &inputs, const VariableNameMap &outputs, const AttributeMap &attrs, std::shared_ptr scope); virtual ~OperatorBase() {} - void Run(); - std::vector GetOutKeys() const; - std::vector GetInputKeys() const; - virtual void RunImpl() = 0; virtual void Init() = 0; - /* - * @b op 运算所需的输入, 如上一层的输出结果、卷积核 - * */ + virtual void InferShape() const = 0; + virtual void Run(); + virtual void RunImpl() = 0; + + std::vector GetOutKeys() const; + std::vector GetInputKeys() const; + const VariableNameMap &Inputs() const { return inputs_; } - /* - * @b op 的输出, 内存会提前被分配好, 运算结果会被存到分配好的内存内 - * */ const VariableNameMap &Outputs() const { return outputs_; } - /* - * @b op 类型 - * */ const std::string &Type() const { return type_; } - /* - * @b op 运算所需要用到的参数: 如 conv 运算所需要用到的 stride - * */ const AttributeMap &Attrs() const { return attrs_; } + void ClearVariables(const std::vector &var_names) const { if (this->scope_) { this->scope_->EraseVars(var_names); } } - /* - * @b 根据输入形状和参数计算出输出形状 - * */ - virtual void InferShape() const = 0; protected: std::shared_ptr scope_; @@ -106,9 +90,6 @@ class OperatorBase { void CheckAllInputOutputSet() const; }; -/* - * @b 这个类为所有带有运算的 op 的父类, 这个 op 继承与 OperatorBase - * */ template class OperatorWithKernel : public OperatorBase { public: @@ -136,9 +117,6 @@ class OperatorWithKernel : public OperatorBase { ParamType param_; }; -/* - * @b 所有kernel的父类 - * */ template class OpKernelBase { public: @@ -150,11 +128,6 @@ class OpKernelBase { } #endif - /* - * @b 所有kernel 需实现 Compute 方法 - * @p para 这个参数为 kernel 运算时所需要用到参数组成的一个结构体, - * 所有结构体存在与: paddle-mobile/src/operators/op_param.h - * */ #ifdef PADDLE_McOBILE_MALI_GPU OpKernelBase() { acl_op_ = nullptr; } void *GetAclOp() const { return acl_op_; } @@ -177,13 +150,6 @@ class OpKernelBase { #endif }; -#define DEFINE_OP_CONSTRUCTOR(cls, parent_cls) \ - cls(const std::string &type, const ::paddle_mobile::VariableNameMap &inputs, \ - const ::paddle_mobile::VariableNameMap &outputs, \ - const ::paddle_mobile::framework::AttributeMap &attrs, \ - std::shared_ptr<::paddle_mobile::framework::Scope> scope) \ - : parent_cls(type, inputs, outputs, attrs, scope) {} - class FusionOpMatcher { public: FusionOpMatcher() {} @@ -202,12 +168,44 @@ class FusionOpMatcher { virtual std::vector> NeedCheck() { return {}; } - // virtual bool Fusion(); protected: Node node_; std::string type_; std::shared_ptr new_opdesc_; }; +#define DECLARE_OPERATOR(OpName, OpParam, OpKernel) \ + template \ + class OpName##Op : public framework::OperatorWithKernel< \ + DeviceType, OpParam, \ + operators::OpKernel> { \ + public: \ + OpName##Op(const std::string &type, const VariableNameMap &inputs, \ + const VariableNameMap &outputs, \ + const framework::AttributeMap &attrs, \ + std::shared_ptr scope) \ + : framework::OperatorWithKernel, \ + operators::OpKernel>( \ + type, inputs, outputs, attrs, scope) {} \ + \ + void InferShape() const override; \ + }; + +#define DECLARE_KERNEL(OpName, OpParam) \ + template \ + class OpName##Kernel \ + : public framework::OpKernelBase> { \ + public: \ + bool Init(OpParam *param); \ + void Compute(const OpParam ¶m); \ + }; + +#define DEFINE_OP_CONSTRUCTOR(cls, parent_cls) \ + cls(const std::string &type, const ::paddle_mobile::VariableNameMap &inputs, \ + const ::paddle_mobile::VariableNameMap &outputs, \ + const ::paddle_mobile::framework::AttributeMap &attrs, \ + std::shared_ptr<::paddle_mobile::framework::Scope> scope) \ + : parent_cls(type, inputs, outputs, attrs, scope) {} + } // namespace framework } // namespace paddle_mobile diff --git a/src/operators/relu_op.cpp b/src/operators/activation_op.cpp similarity index 50% rename from src/operators/relu_op.cpp rename to src/operators/activation_op.cpp index 560b63058646b379a50184e98ac4b4d5dd43f9fa..bcff87c9276721c19a970eb328fc0a183ed6c003 100644 --- a/src/operators/relu_op.cpp +++ b/src/operators/activation_op.cpp @@ -12,29 +12,40 @@ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the specific language governing permissions and limitations under the License. */ -#ifdef RELU_OP - -#include "operators/relu_op.h" +#include "operators/activation_op.h" namespace paddle_mobile { namespace operators { -template -void ReluOp::InferShape() const { - auto input_dims = this->param_.InputX()->dims(); - this->param_.Out()->Resize(input_dims); -} +#define DEFINE_ACTIVATION_INFERSHAPE(OpName) \ + template \ + void OpName##Op::InferShape() const { \ + const auto &input_dims = this->param_.InputX()->dims(); \ + this->param_.Out()->Resize(input_dims); \ + } + +#ifdef RELU_OP +DEFINE_ACTIVATION_INFERSHAPE(Relu); +DEFINE_ACTIVATION_INFERSHAPE(Relu6); +#endif // RELU_OP -template -void Relu6Op::InferShape() const { - auto input_dims = this->param_.InputX()->dims(); - this->param_.Out()->Resize(input_dims); -} +#ifdef SIGMOID_OP +DEFINE_ACTIVATION_INFERSHAPE(Sigmoid); +#endif // SIGMOID_OP + +#ifdef TANH_OP +DEFINE_ACTIVATION_INFERSHAPE(Tanh); +#endif // TANH_OP + +#ifdef LOG_OP +DEFINE_ACTIVATION_INFERSHAPE(Log); +#endif // LOG_OP } // namespace operators } // namespace paddle_mobile namespace ops = paddle_mobile::operators; +#ifdef RELU_OP #ifdef PADDLE_MOBILE_CPU REGISTER_OPERATOR_CPU(relu, ops::ReluOp); REGISTER_OPERATOR_CPU(relu6, ops::Relu6Op); @@ -47,5 +58,23 @@ REGISTER_OPERATOR_MALI_GPU(relu, ops::ReluOp); #ifdef PADDLE_MOBILE_CL REGISTER_OPERATOR_CL(relu, ops::ReluOp); #endif - #endif // RELU_OP + +#ifdef SIGMOID_OP +#ifdef PADDLE_MOBILE_CPU +REGISTER_OPERATOR_CPU(sigmoid, ops::SigmoidOp); +#endif +#endif // SIGMOID_OP + +#ifdef TANH_OP +#ifdef PADDLE_MOBILE_CPU +REGISTER_OPERATOR_CPU(tanh, ops::TanhOp); +#endif +#ifdef PADDLE_MOBILE_FPGA +REGISTER_OPERATOR_FPGA(tanh, ops::TanhOp); +#endif +#endif // TANH_OP + +#ifdef LOG_OP +REGISTER_OPERATOR_CPU(log, ops::LogOp); +#endif // LOG_OP diff --git a/src/operators/tanh_op.h b/src/operators/activation_op.h similarity index 57% rename from src/operators/tanh_op.h rename to src/operators/activation_op.h index 0e8226a1eb9074c00b6be87c3192a5f9f10f79bf..cecf22c2255b37d2ee312f8f90df771ce6a571f4 100644 --- a/src/operators/tanh_op.h +++ b/src/operators/activation_op.h @@ -12,8 +12,6 @@ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the specific language governing permissions and limitations under the License. */ -#ifdef TANH_OP - #pragma once #include @@ -24,21 +22,22 @@ limitations under the License. */ namespace paddle_mobile { namespace operators { -template -class TanhOp : public framework::OperatorWithKernel< - DeviceType, TanhParam, - operators::TanhKernel> { - public: - TanhOp(const std::string &type, const VariableNameMap &inputs, - const VariableNameMap &outputs, const framework::AttributeMap &attrs, - std::shared_ptr scope) - : framework::OperatorWithKernel, - operators::TanhKernel>( - type, inputs, outputs, attrs, scope) {} - void InferShape() const override; -}; +#ifdef RELU_OP +DECLARE_OPERATOR(Relu, ReluParam, ReluKernel); +DECLARE_OPERATOR(Relu6, ReluParam, Relu6Kernel); +#endif -} // namespace operators -} // namespace paddle_mobile +#ifdef SIGMOID_OP +DECLARE_OPERATOR(Sigmoid, SigmoidParam, SigmoidKernel); +#endif +#ifdef TANH_OP +DECLARE_OPERATOR(Tanh, TanhParam, TanhKernel); +#endif + +#ifdef LOG_OP +DECLARE_OPERATOR(Log, ReluParam, LogKernel); #endif + +} // namespace operators +} // namespace paddle_mobile diff --git a/src/operators/tanh_op.cpp b/src/operators/compare_op.cpp similarity index 67% rename from src/operators/tanh_op.cpp rename to src/operators/compare_op.cpp index 77cc980f468e2ec2a192a987496484d935690008..312173a30bad7c5b3762de6f6abc3a735895704c 100644 --- a/src/operators/tanh_op.cpp +++ b/src/operators/compare_op.cpp @@ -12,27 +12,23 @@ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the specific language governing permissions and limitations under the License. */ -#ifdef TANH_OP - -#include "operators/tanh_op.h" +#include "operators/compare_op.h" namespace paddle_mobile { namespace operators { -template -void TanhOp::InferShape() const { - this->param_.Out()->Resize(this->param_.InputX()->dims()); +#ifdef LESS_THAN_OP +template +void LessThanOp::InferShape() const { + const auto &input_dims = this->param_.input_x_->dims(); + this->param_.output_->Resize(input_dims); } +#endif // LESS_THAN_OP } // namespace operators } // namespace paddle_mobile namespace ops = paddle_mobile::operators; -#ifdef PADDLE_MOBILE_CPU -REGISTER_OPERATOR_CPU(tanh, ops::TanhOp); -#endif -#ifdef PADDLE_MOBILE_FPGA -REGISTER_OPERATOR_FPGA(tanh, ops::TanhOp); -#endif - -#endif +#ifdef LESS_THAN_OP +REGISTER_OPERATOR_CPU(less_than, ops::LessThanOp); +#endif // LESS_THAN_OP diff --git a/src/operators/compare_op.h b/src/operators/compare_op.h new file mode 100644 index 0000000000000000000000000000000000000000..83ae88eae948694a8eef0845da699f1af8e2b8a9 --- /dev/null +++ b/src/operators/compare_op.h @@ -0,0 +1,30 @@ +/* Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved. + +Licensed under the Apache License, Version 2.0 (the "License"); +you may not use this file except in compliance with the License. +You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + +Unless required by applicable law or agreed to in writing, software +distributed under the License is distributed on an "AS IS" BASIS, +WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +See the License for the specific language governing permissions and +limitations under the License. */ + +#pragma once + +#include +#include "framework/operator.h" +#include "operators/kernel/compare_kernel.h" +#include "operators/op_param.h" + +namespace paddle_mobile { +namespace operators { + +#ifdef LESS_THAN_OP +DECLARE_OPERATOR(LessThan, CompareParam, LessThanKernel); +#endif // LESS_THAN_OP + +} // namespace operators +} // namespace paddle_mobile diff --git a/src/operators/kernel/activation_kernel.h b/src/operators/kernel/activation_kernel.h index 9dc8f307c0c988355575160a5f3bb4926537a679..9eaf3fd96737a6bad3448160a41d523965008943 100644 --- a/src/operators/kernel/activation_kernel.h +++ b/src/operators/kernel/activation_kernel.h @@ -20,26 +20,21 @@ limitations under the License. */ namespace paddle_mobile { namespace operators { -#define DECLARE_KERNEL(KernelClass, KernelParam) \ - template \ - class KernelClass \ - : public framework::OpKernelBase> { \ - public: \ - bool Init(KernelParam *param); \ - void Compute(const KernelParam ¶m); \ - }; - #ifdef RELU_OP -DECLARE_KERNEL(ReluKernel, ReluParam); -DECLARE_KERNEL(Relu6Kernel, ReluParam); +DECLARE_KERNEL(Relu, ReluParam); +DECLARE_KERNEL(Relu6, ReluParam); #endif #ifdef SIGMOID_OP -DECLARE_KERNEL(SigmoidKernel, SigmoidParam); +DECLARE_KERNEL(Sigmoid, SigmoidParam); #endif #ifdef TANH_OP -DECLARE_KERNEL(TanhKernel, TanhParam); +DECLARE_KERNEL(Tanh, TanhParam); +#endif + +#ifdef LOG_OP +DECLARE_KERNEL(Log, ReluParam); #endif } // namespace operators diff --git a/src/operators/kernel/arm/activation_kernel.cpp b/src/operators/kernel/arm/activation_kernel.cpp index 5050d3b160addd8686849fa70a82cbf3274d5ff6..da418cf6f3a947f55d21264e568d6c16ea69b1ca 100644 --- a/src/operators/kernel/arm/activation_kernel.cpp +++ b/src/operators/kernel/arm/activation_kernel.cpp @@ -105,7 +105,7 @@ void SigmoidKernel::Compute(const SigmoidParam ¶m) { #ifdef TANH_OP template <> -void TanhKernel::Init(TanhParam *param) { +bool TanhKernel::Init(TanhParam *param) { return true; } @@ -117,5 +117,19 @@ void TanhKernel::Compute(const TanhParam ¶m) { } #endif +#ifdef LOG_OP +template <> +bool LogKernel::Init(ReluParam *param) { + return true; +} + +template <> +void LogKernel::Compute(const ReluParam ¶m) { + const Tensor *input = param.InputX(); + Tensor *output = param.Out(); + ActivationCompute()(input, output); +} +#endif + } // namespace operators } // namespace paddle_mobile diff --git a/src/operators/kernel/arm/compare_kernel.cpp b/src/operators/kernel/arm/compare_kernel.cpp new file mode 100644 index 0000000000000000000000000000000000000000..c2ba6b583a1f80c3545f565464ff614ba4aaf52e --- /dev/null +++ b/src/operators/kernel/arm/compare_kernel.cpp @@ -0,0 +1,209 @@ +/* Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved. + +Licensed under the Apache License, Version 2.0 (the "License"); +you may not use this file except in compliance with the License. +You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + +Unless required by applicable law or agreed to in writing, software +distributed under the License is distributed on an "AS IS" BASIS, +WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +See the License for the specific language governing permissions and +limitations under the License. */ + +#include "operators/kernel/compare_kernel.h" +#if defined(__ARM_NEON__) || defined(__ARM_NEON) +#include +#endif + +namespace paddle_mobile { +namespace operators { + +typedef enum { + LESS_THAN = 0, + LESS_EQUAL = 1, + GREATER_THAN = 2, + GREATER_EQUAL = 3, + EQUAL = 4, + NOT_EQUAL = 5, +} CompareType; + +#if defined(__ARM_NEON__) || defined(__ARM_NEON) +template +inline uint32x4_t vcmpq_f32(const float32x4_t x, const float32x4_t y) { + return vcleq_f32(x, y); +} +#endif + +template +inline uint8_t Compare(const float x, const float y) { + return static_cast(x < y); +} + +template +inline uint8_t Compare(const int64_t x, const int64_t y) { + return static_cast(x < y); +} + +template +struct CompareCompute { + void operator()(const Tensor *X, const Tensor *Y, const int Axis, + Tensor *Out) {} +}; + +template +struct CompareCompute { + void operator()(const Tensor *X, const Tensor *Y, const int Axis, + Tensor *Out) { + const float *x = X->data(); + const float *y = Y->data(); + uint8_t *output = reinterpret_cast(Out->mutable_data()); + const auto &x_dims = X->dims(); + const auto &y_dims = Y->dims(); + /// axis = -1 represent the last dimensions. + int axis = (Axis == -1 ? x_dims.size() - y_dims.size() : Axis); + int batch = 1; + int channels = 1; + int elementwise_num = 1; + for (int i = 0; i < axis; ++i) { + batch *= x_dims[i]; + } + for (int i = 0; i < y_dims.size(); ++i) { + channels *= y_dims[i]; + } + for (int i = y_dims.size() + axis; i < x_dims.size(); ++i) { + elementwise_num *= x_dims[i]; + } + // if elementwise_num == 1, compare rowwise + if (elementwise_num == 1) { + int remain_start = 0; +#if defined(__ARM_NEON__) || defined(__ARM_NEON) + remain_start = channels & 0xfff8; + uint8x8_t __mask = vdup_n_u8(0x1); + for (int i = 0; i < batch; ++i) { + for (int j = 0; j < channels - 7; j += 8) { + int x_offset = i * channels + j; + float32x4_t __x0 = vld1q_f32(x + x_offset); + float32x4_t __x1 = vld1q_f32(x + x_offset + 4); + float32x4_t __y0 = vld1q_f32(y + j); + float32x4_t __y1 = vld1q_f32(y + j + 4); + uint32x4_t __cmp0 = vcmpq_f32(__x0, __y0); + uint32x4_t __cmp1 = vcmpq_f32(__x1, __y1); + uint16x4_t __ncmp0 = vmovn_u32(__cmp0); + uint16x4_t __ncmp1 = vmovn_u32(__cmp1); + uint16x8_t __ncmp = vcombine_u16(__ncmp0, __ncmp1); + uint8x8_t __nncmp = vmovn_u16(__ncmp); + __nncmp = vand_u8(__nncmp, __mask); + vst1_u8(output + x_offset, __nncmp); + } + } +#endif // __ARM_NEON__ + for (int i = 0; i < batch; ++i) { + for (int j = remain_start; j < channels; ++j) { + int x_offset = i * channels + j; + output[x_offset] = Compare(x[x_offset], y[j]); + } + } + } else { + for (int i = 0; i < batch; ++i) { + for (int j = 0; j < channels; ++j) { + int x_offset = (i * channels + j) * elementwise_num; + int y_offset = j * elementwise_num; + int remain_start = 0; +#if defined(__ARM_NEON__) || defined(__ARM_NEON) + remain_start = elementwise_num & 0xfff8; + uint8x8_t __mask = vdup_n_u8(0x1); + for (int k = 0; k < elementwise_num - 7; k += 8) { + float32x4_t __x0 = vld1q_f32(x + x_offset); + float32x4_t __x1 = vld1q_f32(x + x_offset + 4); + float32x4_t __y0 = vld1q_f32(y + y_offset); + uint32x4_t __cmp0 = vcmpq_f32(__x0, __y0); + uint32x4_t __cmp1 = vcmpq_f32(__x1, __y0); + uint16x4_t __ncmp0 = vmovn_u32(__cmp0); + uint16x4_t __ncmp1 = vmovn_u32(__cmp1); + uint16x8_t __ncmp = vcombine_u16(__ncmp0, __ncmp1); + uint8x8_t __nncmp = vmovn_u16(__ncmp); + __nncmp = vand_u8(__nncmp, __mask); + vst1_u8(output + x_offset, __nncmp); + x_offset += 8; + y_offset += 8; + } +#endif // __ARM_NEON__ + for (int k = remain_start; k < elementwise_num; ++k) { + output[x_offset + k] = Compare(x[x_offset + k], y[y_offset]); + } + } + } + } + } +}; + +template +struct CompareCompute { + void operator()(const Tensor *X, const Tensor *Y, const int Axis, + Tensor *Out) { + const int64_t *x = X->data(); + const int64_t *y = Y->data(); + uint8_t *output = reinterpret_cast(Out->mutable_data()); + const auto &x_dims = X->dims(); + const auto &y_dims = Y->dims(); + /// axis = -1 represent the last dimensions. + int axis = (Axis == -1 ? x_dims.size() - y_dims.size() : Axis); + int batch = 1; + int channels = 1; + int elementwise_num = 1; + for (int i = 0; i < axis; ++i) { + batch *= x_dims[i]; + } + for (int i = 0; i < y_dims.size(); ++i) { + channels *= y_dims[i]; + } + for (int i = y_dims.size() + axis; i < x_dims.size(); ++i) { + elementwise_num *= x_dims[i]; + } + // if elementwise_num == 1, compare rowwise + if (elementwise_num == 1) { + for (int i = 0; i < batch; ++i) { + for (int j = 0; j < channels; ++j) { + int x_offset = i * channels + j; + output[x_offset] = Compare(x[x_offset], y[j]); + } + } + } else { + for (int i = 0; i < batch; ++i) { + for (int j = 0; j < channels; ++j) { + int x_offset = (i * channels + j) * elementwise_num; + int y_offset = j * elementwise_num; + for (int k = 0; k < elementwise_num; ++k) { + output[x_offset + k] = Compare(x[x_offset + k], y[y_offset]); + } + } + } + } + } +}; + +#ifdef LESS_THAN_OP +template <> +bool LessThanKernel::Init(CompareParam *param) { + return true; +} + +template <> +void LessThanKernel::Compute(const CompareParam ¶m) { + if (param.input_x_->type() == typeid(int64_t)) { + CompareCompute()(param.input_x_, param.input_y_, + param.axis_, param.output_); + } else if (param.input_x_->type() == typeid(float)) { + CompareCompute()(param.input_x_, param.input_y_, + param.axis_, param.output_); + } else { + PADDLE_MOBILE_THROW_EXCEPTION( + "LessThan only support int64_t and float data type."); + } +} +#endif // LESS_THAN_OP + +} // namespace operators +} // namespace paddle_mobile diff --git a/src/operators/kernel/arm/lod_reset_kernel.cpp b/src/operators/kernel/arm/lod_reset_kernel.cpp new file mode 100644 index 0000000000000000000000000000000000000000..f3bb206447c87941f150c70c2297d8d1c5976231 --- /dev/null +++ b/src/operators/kernel/arm/lod_reset_kernel.cpp @@ -0,0 +1,62 @@ +/* Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved. + +Licensed under the Apache License, Version 2.0 (the "License"); +you may not use this file except in compliance with the License. +You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + +Unless required by applicable law or agreed to in writing, software +distributed under the License is distributed on an "AS IS" BASIS, +WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +See the License for the specific language governing permissions and +limitations under the License. */ + +#ifdef LOD_RESET_OP + +#include "operators/kernel/kernels.h" + +namespace paddle_mobile { +namespace operators { + +template <> +bool LodResetKernel::Init(LodResetParam *param) { + return true; +} + +template <> +void LodResetKernel::Compute(const LodResetParam ¶m) { + const auto *input = param.input_x_; + const auto *lod_t = param.input_y_; + auto *output = param.output_; + + output->ShareDataWith(*input); + + std::vector level0; + if (lod_t) { + if (lod_t->lod().size() > 0) { + output->set_lod(lod_t->lod()); + return; // early return, since lod already set + } else { + auto *lod = lod_t->data(); + level0 = std::vector(lod, lod + lod_t->numel()); + } + } else { + level0 = param.target_lod_; + } + + // cast level0 to size_t + std::vector ulevel0(level0.size(), 0); + for (int i = 0; i < level0.size(); ++i) { + ulevel0[i] = level0[i]; + } + + framework::LoD target_lod; + target_lod.push_back(std::move(ulevel0)); + output->set_lod(target_lod); +} + +} // namespace operators +} // namespace paddle_mobile + +#endif // LOD_RESET_OP diff --git a/src/operators/kernel/arm/sequence_pool_kernel.cpp b/src/operators/kernel/arm/sequence_pool_kernel.cpp index f4e28a0ffbbc13428bd8b4643aaae915f14539bc..352158b973050c99555a82c0d0f02c318b7702ac 100644 --- a/src/operators/kernel/arm/sequence_pool_kernel.cpp +++ b/src/operators/kernel/arm/sequence_pool_kernel.cpp @@ -66,8 +66,9 @@ void SequencePoolImpl(const framework::LoDTensor &input, memcpy(out_ptr, in_ptr, width * sizeof(float)); in_ptr += width; int remain_h = height - 1; + int remain_w_start = 0; #ifdef __ARM_NEON__ - int remain_w_start = width & 0xfffc; + remain_w_start = width & 0xfffc; #endif // __ARM_NEON__ for (int h = 0; h < remain_h; ++h) { #ifdef __ARM_NEON__ @@ -124,9 +125,10 @@ void SequencePoolImpl(const framework::LoDTensor &input, memcpy(out_ptr, in_ptr, width * sizeof(float)); in_ptr += width; int remain_h = height - 1; + int remain_w_start = 0; #ifdef __ARM_NEON__ int loop_w = width >> 2; - int remain_w_start = width & 0xfffc; + remain_w_start = width & 0xfffc; #endif // __ARM_NEON__ for (int h = 0; h < remain_h; ++h) { #ifdef __ARM_NEON__ diff --git a/src/operators/kernel/compare_kernel.h b/src/operators/kernel/compare_kernel.h new file mode 100644 index 0000000000000000000000000000000000000000..0f8a8ac74131054ebca53566dc38c374e9dafe4c --- /dev/null +++ b/src/operators/kernel/compare_kernel.h @@ -0,0 +1,28 @@ +/* Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved. + +Licensed under the Apache License, Version 2.0 (the "License"); +you may not use this file except in compliance with the License. +You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + +Unless required by applicable law or agreed to in writing, software +distributed under the License is distributed on an "AS IS" BASIS, +WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +See the License for the specific language governing permissions and +limitations under the License. */ + +#pragma once + +#include "framework/operator.h" +#include "operators/op_param.h" + +namespace paddle_mobile { +namespace operators { + +#ifdef LESS_THAN_OP +DECLARE_KERNEL(LessThan, CompareParam); +#endif // LESS_THAN_OP + +} // namespace operators +} // namespace paddle_mobile diff --git a/src/operators/kernel/dequant_bn_kernel.h b/src/operators/kernel/dequant_bn_kernel.h index abf2c68e8a965e9741520731c5c34beca8777299..cf759bf69cc959759d770b685cffaef25ac24386 100644 --- a/src/operators/kernel/dequant_bn_kernel.h +++ b/src/operators/kernel/dequant_bn_kernel.h @@ -20,37 +20,28 @@ limitations under the License. */ namespace paddle_mobile { namespace operators { -#define DECLARE_KERNEL(KernelClass, KernelParam) \ - template \ - class KernelClass \ - : public framework::OpKernelBase> { \ - public: \ - bool Init(KernelParam *param); \ - void Compute(const KernelParam ¶m); \ - }; - #ifdef FUSION_DEQUANT_BN_OP -DECLARE_KERNEL(FusionDequantBNKernel, FusionDequantBNParam); +DECLARE_KERNEL(FusionDequantBN, FusionDequantBNParam); #endif #ifdef FUSION_DEQUANT_BN_RELU_OP -DECLARE_KERNEL(FusionDequantBNReluKernel, FusionDequantBNParam); +DECLARE_KERNEL(FusionDequantBNRelu, FusionDequantBNParam); #endif #ifdef FUSION_DEQUANT_ADD_BN_OP -DECLARE_KERNEL(FusionDequantAddBNKernel, FusionDequantAddBNParam); +DECLARE_KERNEL(FusionDequantAddBN, FusionDequantAddBNParam); #endif #ifdef FUSION_DEQUANT_ADD_BN_RELU_OP -DECLARE_KERNEL(FusionDequantAddBNReluKernel, FusionDequantAddBNParam); +DECLARE_KERNEL(FusionDequantAddBNRelu, FusionDequantAddBNParam); #endif #ifdef FUSION_DEQUANT_ADD_BN_QUANT_OP -DECLARE_KERNEL(FusionDequantAddBNQuantKernel, FusionDequantAddBNQuantParam); +DECLARE_KERNEL(FusionDequantAddBNQuant, FusionDequantAddBNQuantParam); #endif #ifdef FUSION_DEQUANT_ADD_BN_RELU_QUANT_OP -DECLARE_KERNEL(FusionDequantAddBNReluQuantKernel, FusionDequantAddBNQuantParam); +DECLARE_KERNEL(FusionDequantAddBNReluQuant, FusionDequantAddBNQuantParam); #endif } // namespace operators diff --git a/src/operators/kernel/kernels.h b/src/operators/kernel/kernels.h index 4f7d50750d7a2ce875d0d848732270b075162e01..668344674c91827775b78b71c4c50ada6d7108b7 100644 --- a/src/operators/kernel/kernels.h +++ b/src/operators/kernel/kernels.h @@ -20,22 +20,17 @@ limitations under the License. */ namespace paddle_mobile { namespace operators { -#define DECLARE_KERNEL(KernelClass, KernelParam) \ - template \ - class KernelClass \ - : public framework::OpKernelBase> { \ - public: \ - bool Init(KernelParam *param); \ - void Compute(const KernelParam ¶m); \ - }; - #ifdef TOP_K_OP -DECLARE_KERNEL(TopKKernel, TopKParam) +DECLARE_KERNEL(TopK, TopKParam); #endif // TOP_K_OP #ifdef CAST_OP -DECLARE_KERNEL(CastKernel, CastParam) +DECLARE_KERNEL(Cast, CastParam); #endif // CAST_OP +#ifdef LOD_RESET_OP +DECLARE_KERNEL(LodReset, LodResetParam); +#endif // LOD_RESET_OP + } // namespace operators } // namespace paddle_mobile diff --git a/src/operators/kernel/sequence_kernels.h b/src/operators/kernel/sequence_kernels.h index 7884d0d475949c8a54b0ecc08fb578807ca2e2d2..ccee8c521690888257092c7c457534ae2149d9d0 100644 --- a/src/operators/kernel/sequence_kernels.h +++ b/src/operators/kernel/sequence_kernels.h @@ -20,25 +20,16 @@ limitations under the License. */ namespace paddle_mobile { namespace operators { -#define DECLARE_KERNEL(KernelClass, KernelParam) \ - template \ - class KernelClass \ - : public framework::OpKernelBase> { \ - public: \ - bool Init(KernelParam *param); \ - void Compute(const KernelParam ¶m); \ - }; - #ifdef SEQUENCE_EXPAND_OP -DECLARE_KERNEL(SequenceExpandKernel, SequenceExpandParam); +DECLARE_KERNEL(SequenceExpand, SequenceExpandParam); #endif // SEQUENCE_EXPAND_OP #ifdef SEQUENCE_POOL_OP -DECLARE_KERNEL(SequencePoolKernel, SequencePoolParam); +DECLARE_KERNEL(SequencePool, SequencePoolParam); #endif // SEQUENCE_POOL_OP #ifdef SEQUENCE_SOFTMAX_OP -DECLARE_KERNEL(SequenceSoftmaxKernel, SoftmaxParam); +DECLARE_KERNEL(SequenceSoftmax, SoftmaxParam); #endif // SEQUENCE_SOFTMAX_OP } // namespace operators diff --git a/src/operators/sigmoid_op.cpp b/src/operators/lod_reset_op.cpp similarity index 70% rename from src/operators/sigmoid_op.cpp rename to src/operators/lod_reset_op.cpp index 04410ece583b63f5b8d9a04342f6418a85475561..1eca733fd95e0893fe811da15290ee5878d1ac77 100644 --- a/src/operators/sigmoid_op.cpp +++ b/src/operators/lod_reset_op.cpp @@ -12,16 +12,17 @@ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the specific language governing permissions and limitations under the License. */ -#ifdef SIGMOID_OP +#ifdef LOD_RESET_OP -#include "operators/sigmoid_op.h" +#include "operators/lod_reset_op.h" namespace paddle_mobile { namespace operators { -template -void SigmoidOp::InferShape() const { - this->param_.Out()->Resize(this->param_.InputX()->dims()); +template +void LodResetOp::InferShape() const { + const auto &input_dims = this->param_.input_x_->dims(); + this->param_.output_->Resize(input_dims); } } // namespace operators @@ -29,7 +30,7 @@ void SigmoidOp::InferShape() const { namespace ops = paddle_mobile::operators; #ifdef PADDLE_MOBILE_CPU -REGISTER_OPERATOR_CPU(sigmoid, ops::SigmoidOp); +REGISTER_OPERATOR_CPU(lod_reset, ops::LodResetOp); #endif -#endif +#endif // LOD_RESET_OP diff --git a/src/operators/sigmoid_op.h b/src/operators/lod_reset_op.h similarity index 50% rename from src/operators/sigmoid_op.h rename to src/operators/lod_reset_op.h index f918b1a86f806bcba78f67900fe6bb2b56cd6a0f..46932dcfabd1c59b26bf0f1a21b7e927fc5aba2e 100644 --- a/src/operators/sigmoid_op.h +++ b/src/operators/lod_reset_op.h @@ -12,34 +12,21 @@ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the specific language governing permissions and limitations under the License. */ -#ifdef SIGMOID_OP +#ifdef LOD_RESET_OP #pragma once #include #include "framework/operator.h" -#include "operators/kernel/activation_kernel.h" +#include "operators/kernel/kernels.h" #include "operators/op_param.h" namespace paddle_mobile { namespace operators { -template -class SigmoidOp : public framework::OperatorWithKernel< - DeviceType, SigmoidParam, - operators::SigmoidKernel> { - public: - SigmoidOp(const std::string &type, const VariableNameMap &inputs, - const VariableNameMap &outputs, - const framework::AttributeMap &attrs, - std::shared_ptr scope) - : framework::OperatorWithKernel, - operators::SigmoidKernel>( - type, inputs, outputs, attrs, scope) {} - void InferShape() const override; -}; +DECLARE_OPERATOR(LodReset, LodResetParam, LodResetKernel); } // namespace operators } // namespace paddle_mobile -#endif +#endif // LOD_RESET_OP diff --git a/src/operators/math/activation.h b/src/operators/math/activation.h index 51ce3789785a4e4211298e44312a87ec2de09ea0..08ba4a8f2a7442860a0516f0f6e2726f5d09ec6d 100644 --- a/src/operators/math/activation.h +++ b/src/operators/math/activation.h @@ -86,6 +86,11 @@ inline float32x4_t vActiveq_f32(const float32x4_t &x) { __out = vmulq_n_f32(__out, 2.f); return vsubq_f32(__out, __one); } + +template <> +inline float32x4_t vActiveq_f32(const float32x4_t &x) { + return log_ps(x); +} #endif template @@ -119,6 +124,11 @@ inline float Active(const float &x) { return 2.f / (1.f + exp(-2.f * x)) - 1.f; } +template <> +inline float Active(const float &x) { + return log(x); +} + } // namespace math } // namespace operators } // namespace paddle_mobile diff --git a/src/operators/op_param.h b/src/operators/op_param.h index 385be3b72f233c9a0951f17b8c61c23adc346988..d20075f89195bbbd3a35577b19f84b9bb91b2a1c 100644 --- a/src/operators/op_param.h +++ b/src/operators/op_param.h @@ -2829,5 +2829,55 @@ class SequencePoolParam : public OpParam { }; #endif // SEQUENCE_EXPAND_OP +#ifdef LOD_RESET_OP +template +class LodResetParam : public OpParam { + typedef typename DtypeTensorTrait::gtype GType; + typedef typename DtypeTensorTrait::rtype RType; + + public: + LodResetParam(const VariableNameMap &inputs, const VariableNameMap &outputs, + const AttributeMap &attrs, const Scope &scope) { + input_x_ = InputXFrom(inputs, scope); + output_ = OutFrom(outputs, scope); + input_y_ = nullptr; + if (inputs.count("Y")) { + input_y_ = InputYFrom(inputs, scope); + } else { + target_lod_ = OpParam::GetAttr>("target_lod", attrs); + } + } + + public: + GType *input_x_; + GType *input_y_; + GType *output_; + std::vector target_lod_; +}; +#endif // LOD_RESET_OP + +#ifdef LESS_THAN_OP +template +class CompareParam : public OpParam { + typedef typename DtypeTensorTrait::gtype GType; + typedef typename DtypeTensorTrait::rtype RType; + + public: + CompareParam(const VariableNameMap &inputs, const VariableNameMap &outputs, + const AttributeMap &attrs, const Scope &scope) { + input_x_ = InputXFrom(inputs, scope); + input_y_ = InputYFrom(inputs, scope); + output_ = OutFrom(outputs, scope); + axis_ = OpParam::GetAttr("axis", attrs); + } + + public: + GType *input_x_; + GType *input_y_; + GType *output_; + int axis_; +}; +#endif // LESS_THAN_OP + } // namespace operators } // namespace paddle_mobile diff --git a/src/operators/relu_op.h b/src/operators/relu_op.h deleted file mode 100644 index 9e3f109e74876b9f680dbac8aa2e67dd0bb83709..0000000000000000000000000000000000000000 --- a/src/operators/relu_op.h +++ /dev/null @@ -1,61 +0,0 @@ -/* Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved. - -Licensed under the Apache License, Version 2.0 (the "License"); -you may not use this file except in compliance with the License. -You may obtain a copy of the License at - - http://www.apache.org/licenses/LICENSE-2.0 - -Unless required by applicable law or agreed to in writing, software -distributed under the License is distributed on an "AS IS" BASIS, -WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -See the License for the specific language governing permissions and -limitations under the License. */ - -#ifdef RELU_OP - -#pragma once - -#include - -#include "framework/operator.h" -#include "operators/kernel/activation_kernel.h" -#include "operators/op_param.h" - -namespace paddle_mobile { -namespace operators { - -template -class ReluOp : public framework::OperatorWithKernel< - DeviceType, ReluParam, - operators::ReluKernel> { - public: - ReluOp(const std::string &type, const VariableNameMap &inputs, - const VariableNameMap &outputs, const framework::AttributeMap &attrs, - std::shared_ptr scope) - : framework::OperatorWithKernel, - operators::ReluKernel>( - type, inputs, outputs, attrs, scope) {} - - void InferShape() const override; -}; - -template -class Relu6Op : public framework::OperatorWithKernel< - DeviceType, ReluParam, - operators::Relu6Kernel> { - public: - Relu6Op(const std::string &type, const VariableNameMap &inputs, - const VariableNameMap &outputs, const framework::AttributeMap &attrs, - std::shared_ptr scope) - : framework::OperatorWithKernel, - operators::Relu6Kernel>( - type, inputs, outputs, attrs, scope) {} - - void InferShape() const override; -}; - -} // namespace operators -} // namespace paddle_mobile - -#endif diff --git a/test/CMakeLists.txt b/test/CMakeLists.txt index e90fe2c904868d0145a889033720e4948a1f3c33..75ad5348aa0743c081e2df3a59c190fa4c9a64f9 100644 --- a/test/CMakeLists.txt +++ b/test/CMakeLists.txt @@ -238,12 +238,21 @@ if (NOT FOUND_MATCH) ADD_EXECUTABLE(test-relu6-op operators/test_relu6_op.cpp test_helper.h test_include.h) target_link_libraries(test-relu6-op paddle-mobile) + ADD_EXECUTABLE(test-tanh-op operators/test_tanh_op.cpp test_helper.h test_include.h) + target_link_libraries(test-tanh-op paddle-mobile) + + ADD_EXECUTABLE(test-log-op operators/test_log_op.cpp test_helper.h test_include.h) + target_link_libraries(test-log-op paddle-mobile) + ADD_EXECUTABLE(test-topk-op operators/test_topk_op.cpp test_helper.h test_include.h) target_link_libraries(test-topk-op paddle-mobile) ADD_EXECUTABLE(test-cast-op operators/test_cast_op.cpp test_helper.h test_include.h) target_link_libraries(test-cast-op paddle-mobile) + ADD_EXECUTABLE(test-less-than-op operators/test_less_than_op.cpp test_helper.h test_include.h) + target_link_libraries(test-less-than-op paddle-mobile) + # gen test ADD_EXECUTABLE(test-fc-op operators/test_fusion_fc_op.cpp test_helper.h test_include.h) target_link_libraries(test-fc-op paddle-mobile) diff --git a/test/executor_for_test.h b/test/executor_for_test.h index 8edac50f69d4f96a45cefb4ec7555b7f518ca36f..947f41032030f51e7522f4305ac395dd0c1fc211 100644 --- a/test/executor_for_test.h +++ b/test/executor_for_test.h @@ -20,12 +20,11 @@ limitations under the License. */ #include "common/log.h" #include "framework/executor.h" #include "framework/op_registry.h" +#include "operators/activation_op.h" #include "operators/conv_op.h" #include "operators/elementwise_add_op.h" #include "operators/pool_op.h" -#include "operators/relu_op.h" #include "operators/reshape_op.h" -#include "operators/sigmoid_op.h" #include "operators/softmax_op.h" #include "operators/transpose_op.h" diff --git a/test/net/test_benchmark.cpp b/test/net/test_benchmark.cpp index a95d6c850e80216f9996bc8d582c0646eea1b78b..31a0850c4d531d13f7960d9857b3721ee69c6d27 100644 --- a/test/net/test_benchmark.cpp +++ b/test/net/test_benchmark.cpp @@ -43,7 +43,8 @@ int main(int argc, char* argv[]) { std::shared_ptr output; std::vector dims{1, 3, 224, 224}; if (feed_shape) { - sscanf(feed_shape, "%d,%d,%d,%d", &dims[0], &dims[1], &dims[2], &dims[3]); + sscanf(feed_shape, "%ld,%ld,%ld,%ld", &dims[0], &dims[1], &dims[2], + &dims[3]); } std::cout << "feed shape: [" << dims[0] << ", " << dims[1] << ", " << dims[2] << ", " << dims[3] << "]\n"; diff --git a/test/operators/test_less_than_op.cpp b/test/operators/test_less_than_op.cpp new file mode 100644 index 0000000000000000000000000000000000000000..5c8fa8910d9abfb6ac0a834d9d00274b35fc790b --- /dev/null +++ b/test/operators/test_less_than_op.cpp @@ -0,0 +1,122 @@ +/* Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved. + +Licensed under the Apache License, Version 2.0 (the "License"); +you may not use this file except in compliance with the License. +You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + +Unless required by applicable law or agreed to in writing, software +distributed under the License is distributed on an "AS IS" BASIS, +WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +See the License for the specific language governing permissions and +limitations under the License. */ + +#include +#include +#include "../test_include.h" +#include "operators/compare_op.h" + +namespace paddle_mobile { + +template +void LessThan(const framework::Tensor *X, const framework::Tensor *Y, + const int Axis, framework::Tensor *Out) { + const T *x = X->data(); + const T *y = Y->data(); + bool *output = Out->mutable_data(); + const auto &x_dims = X->dims(); + const auto &y_dims = Y->dims(); + /// axis = -1 represent the last dimensions. + int axis = (Axis == -1 ? x_dims.size() - y_dims.size() : Axis); + int batch = 1; + int channels = 1; + int elementwise_num = 1; + for (int i = 0; i < axis; ++i) { + batch *= x_dims[i]; + } + for (int i = 0; i < y_dims.size(); ++i) { + channels *= y_dims[i]; + } + for (int i = y_dims.size() + axis; i < x_dims.size(); ++i) { + elementwise_num *= x_dims[i]; + } + // less than + for (int i = 0; i < batch; ++i) { + for (int j = 0; j < channels; ++j) { + int x_offset = (i * channels + j) * elementwise_num; + int y_offset = j * elementwise_num; + for (int k = 0; k < elementwise_num; ++k) { + output[x_offset + k] = (x[x_offset + k] < y[y_offset]); + } + } + } +} + +template +int TestLessThanOp(const std::vector &x_shape, + const std::vector &y_shape, const int axis) { + framework::DDim xdims = framework::make_ddim(x_shape); + framework::DDim ydims = framework::make_ddim(y_shape); + VariableNameMap inputs; + VariableNameMap outputs; + auto scope = std::make_shared(); + inputs["X"] = std::vector({"inputx"}); + inputs["Y"] = std::vector({"inputy"}); + outputs["Out"] = std::vector({"output"}); + + auto inputx_var = scope.get()->Var("inputx"); + auto inputx = inputx_var->template GetMutable(); + SetupTensor(inputx, xdims, static_cast(-100), static_cast(100)); + auto inputy_var = scope.get()->Var("inputy"); + auto inputy = inputy_var->template GetMutable(); + SetupTensor(inputy, ydims, static_cast(-100), static_cast(100)); + + auto output_var = scope.get()->Var("output"); + + framework::AttributeMap attrs; + attrs["axis"].Set(axis); + auto *op = new operators::LessThanOp("less_than", inputs, outputs, + attrs, scope); + op->InferShape(); + op->Init(); + op->Run(); + + auto output = output_var->template Get(); + + framework::Tensor output_cmp; + bool *output_cmp_data = output_cmp.mutable_data(output->dims()); + LessThan(inputx, inputy, axis, &output_cmp); + + const bool *output_data = output->data(); + for (int i = 0; i < output->numel(); ++i) { + if (output_data[i] != output_cmp_data[i]) { + LOG(kLOG_INFO) << "output_data[" << i << "] = " << output_data[i] + << ", output_cmp_data[" << i + << "] = " << output_cmp_data[i]; + delete op; + exit(1); + } + } + delete op; + return 0; +} + +} // namespace paddle_mobile + +int main() { + paddle_mobile::TestLessThanOp({1, 2, 3}, {1, 2, 3}, 0); + paddle_mobile::TestLessThanOp({10, 2, 1}, {10, 2, 1}, 0); + + paddle_mobile::TestLessThanOp({2, 10, 1}, {1, 10, 1}, 1); + paddle_mobile::TestLessThanOp({10, 2, 1}, {1, 2, 1}, 1); + + paddle_mobile::TestLessThanOp({1, 2, 3}, {1, 2, 3}, 0); + paddle_mobile::TestLessThanOp({10, 2, 1}, {10, 2, 1}, 0); + + paddle_mobile::TestLessThanOp({2, 10, 1}, {1, 10, 1}, 1); + paddle_mobile::TestLessThanOp({10, 2, 1}, {1, 2, 1}, 1); + + std::cout << "test less_than op pass." << std::endl; + return 0; +} diff --git a/test/operators/test_log_op.cpp b/test/operators/test_log_op.cpp new file mode 100644 index 0000000000000000000000000000000000000000..8d675f06decc902365c32d797b432923933656f7 --- /dev/null +++ b/test/operators/test_log_op.cpp @@ -0,0 +1,81 @@ +/* Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved. + +Licensed under the Apache License, Version 2.0 (the "License"); +you may not use this file except in compliance with the License. +You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + +Unless required by applicable law or agreed to in writing, software +distributed under the License is distributed on an "AS IS" BASIS, +WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +See the License for the specific language governing permissions and +limitations under the License. */ + +#include +#include +#include "../test_include.h" +#include "operators/activation_op.h" + +namespace paddle_mobile { + +void Log(const framework::Tensor *X, framework::Tensor *Y) { + const float *x = X->data(); + float *y = Y->mutable_data(); + + for (int i = 0; i < X->numel(); ++i) { + y[i] = log(x[i]); + } +} + +int TestLogOp(const std::vector input_shape) { + framework::DDim dims = framework::make_ddim(input_shape); + VariableNameMap inputs; + VariableNameMap outputs; + auto scope = std::make_shared(); + inputs["X"] = std::vector({"input"}); + outputs["Out"] = std::vector({"output"}); + + auto input_var = scope.get()->Var("input"); + auto input = input_var->template GetMutable(); + SetupTensor(input, dims, 0.0001, 100.0); + + auto output_var = scope.get()->Var("output"); + + framework::AttributeMap attrs; + auto *op = + new operators::LogOp("log", inputs, outputs, attrs, scope); + op->InferShape(); + op->Init(); + op->Run(); + + auto output = output_var->template Get(); + + framework::Tensor output_cmp; + float *output_cmp_data = output_cmp.mutable_data(output->dims()); + Log(input, &output_cmp); + + const float *output_data = output->data(); + for (int i = 0; i < output->numel(); ++i) { + float gap = output_data[i] - output_cmp_data[i]; + if (std::abs(gap / (output_data[i] + 1e-5)) > 1e-3) { + LOG(kLOG_INFO) << "output_data[" << i << "] = " << output_data[i] + << ", output_cmp_data[" << i + << "] = " << output_cmp_data[i]; + delete op; + exit(1); + } + } + delete op; + return 0; +} + +} // namespace paddle_mobile + +int main() { + paddle_mobile::TestLogOp({1, 1, 2, 3}); + paddle_mobile::TestLogOp({1, 3, 11, 22}); + paddle_mobile::TestLogOp({1, 32, 112, 112}); + std::cout << "test log op pass." << std::endl; + return 0; +} diff --git a/test/operators/test_relu6_op.cpp b/test/operators/test_relu6_op.cpp index 2d2885f3ea94f522adbccefe5010662920a367a4..ceaabcb31343629fa52aef996e3906458b1e011a 100644 --- a/test/operators/test_relu6_op.cpp +++ b/test/operators/test_relu6_op.cpp @@ -15,7 +15,7 @@ limitations under the License. */ #include #include #include "../test_include.h" -#include "operators/relu_op.h" +#include "operators/activation_op.h" namespace paddle_mobile { diff --git a/test/operators/test_relu_op.cpp b/test/operators/test_relu_op.cpp index c38a16e684029e22a3f1b489c1a83776e91382c2..e82e681e3128177300f54326bc346313024644ef 100644 --- a/test/operators/test_relu_op.cpp +++ b/test/operators/test_relu_op.cpp @@ -15,7 +15,7 @@ limitations under the License. */ #include #include #include "../test_include.h" -#include "operators/relu_op.h" +#include "operators/activation_op.h" namespace paddle_mobile { diff --git a/test/operators/test_sigmoid_op.cpp b/test/operators/test_sigmoid_op.cpp index 55ea43e1ea8e196c7397b7739cd83183ed7e8852..40f6461a2cfdfb67b135a5a3a22c29bf19750189 100644 --- a/test/operators/test_sigmoid_op.cpp +++ b/test/operators/test_sigmoid_op.cpp @@ -12,15 +12,70 @@ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the specific language governing permissions and limitations under the License. */ -#include "../test_helper.h" +#include +#include +#include "../test_include.h" +#include "operators/activation_op.h" -int main() { - paddle_mobile::framework::Tensor input; - paddle_mobile::framework::Tensor output; - SetupTensor(&input, {1, 4, 60, 60}, static_cast(0), - static_cast(1)); +namespace paddle_mobile { + +void Sigmoid(const framework::Tensor *X, framework::Tensor *Y) { + const float *x = X->data(); + float *y = Y->mutable_data(); + + for (int i = 0; i < X->numel(); ++i) { + y[i] = 1.f / (1.f + exp(-x[i])); + } +} + +int TestSigmoidOp(const std::vector input_shape) { + framework::DDim dims = framework::make_ddim(input_shape); + VariableNameMap inputs; + VariableNameMap outputs; + auto scope = std::make_shared(); + inputs["X"] = std::vector({"input"}); + outputs["Out"] = std::vector({"output"}); + + auto input_var = scope.get()->Var("input"); + auto input = input_var->template GetMutable(); + SetupTensor(input, dims, -100.0, 100.0); + + auto output_var = scope.get()->Var("output"); + + framework::AttributeMap attrs; + auto *op = new operators::SigmoidOp("sigmoid", inputs, outputs, + attrs, scope); + op->InferShape(); + op->Init(); + op->Run(); - auto out_ddim = paddle_mobile::framework::make_ddim({1, 4, 60, 60}); - output.Resize(out_ddim); + auto output = output_var->template Get(); + + framework::Tensor output_cmp; + float *output_cmp_data = output_cmp.mutable_data(output->dims()); + Sigmoid(input, &output_cmp); + + const float *output_data = output->data(); + for (int i = 0; i < output->numel(); ++i) { + float gap = output_data[i] - output_cmp_data[i]; + if (std::abs(gap / (output_data[i] + 1e-5)) > 1e-3) { + LOG(kLOG_INFO) << "output_data[" << i << "] = " << output_data[i] + << ", output_cmp_data[" << i + << "] = " << output_cmp_data[i]; + delete op; + exit(1); + } + } + delete op; + return 0; +} + +} // namespace paddle_mobile + +int main() { + paddle_mobile::TestSigmoidOp({1, 1, 2, 3}); + paddle_mobile::TestSigmoidOp({1, 3, 11, 22}); + paddle_mobile::TestSigmoidOp({1, 32, 112, 112}); + std::cout << "test sigmoid op pass." << std::endl; return 0; } diff --git a/test/operators/test_tanh_op.cpp b/test/operators/test_tanh_op.cpp new file mode 100644 index 0000000000000000000000000000000000000000..b8006931075d742724d18c3af3627f780a7bf454 --- /dev/null +++ b/test/operators/test_tanh_op.cpp @@ -0,0 +1,81 @@ +/* Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved. + +Licensed under the Apache License, Version 2.0 (the "License"); +you may not use this file except in compliance with the License. +You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + +Unless required by applicable law or agreed to in writing, software +distributed under the License is distributed on an "AS IS" BASIS, +WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +See the License for the specific language governing permissions and +limitations under the License. */ + +#include +#include +#include "../test_include.h" +#include "operators/activation_op.h" + +namespace paddle_mobile { + +void Tanh(const framework::Tensor *X, framework::Tensor *Y) { + const float *x = X->data(); + float *y = Y->mutable_data(); + + for (int i = 0; i < X->numel(); ++i) { + y[i] = 2.f / (1.f + exp(-2.f * x[i])) - 1.f; + } +} + +int TestTanhOp(const std::vector input_shape) { + framework::DDim dims = framework::make_ddim(input_shape); + VariableNameMap inputs; + VariableNameMap outputs; + auto scope = std::make_shared(); + inputs["X"] = std::vector({"input"}); + outputs["Out"] = std::vector({"output"}); + + auto input_var = scope.get()->Var("input"); + auto input = input_var->template GetMutable(); + SetupTensor(input, dims, -100.0, 100.0); + + auto output_var = scope.get()->Var("output"); + + framework::AttributeMap attrs; + auto *op = + new operators::TanhOp("tanh", inputs, outputs, attrs, scope); + op->InferShape(); + op->Init(); + op->Run(); + + auto output = output_var->template Get(); + + framework::Tensor output_cmp; + float *output_cmp_data = output_cmp.mutable_data(output->dims()); + Tanh(input, &output_cmp); + + const float *output_data = output->data(); + for (int i = 0; i < output->numel(); ++i) { + float gap = output_data[i] - output_cmp_data[i]; + if (std::abs(gap / (output_data[i] + 1e-5)) > 1e-3) { + LOG(kLOG_INFO) << "output_data[" << i << "] = " << output_data[i] + << ", output_cmp_data[" << i + << "] = " << output_cmp_data[i]; + delete op; + exit(1); + } + } + delete op; + return 0; +} + +} // namespace paddle_mobile + +int main() { + paddle_mobile::TestTanhOp({1, 1, 2, 3}); + paddle_mobile::TestTanhOp({1, 3, 11, 22}); + paddle_mobile::TestTanhOp({1, 32, 112, 112}); + std::cout << "test sigmoid op pass." << std::endl; + return 0; +} diff --git a/tools/build.sh b/tools/build.sh index 5cb0887e3aa43038f1cc58c915f1e6809dd4ac89..117e74adeafae185693c751462454ecbefbd48ca 100755 --- a/tools/build.sh +++ b/tools/build.sh @@ -173,7 +173,7 @@ build_error() { } if [ $# -lt 1 ]; then - echo "error: target missing!" + echo "error: target missing!" echo "available targets: ios|android" echo "sample usage: ./build.sh android" else diff --git a/tools/op.cmake b/tools/op.cmake index e98e95e4ed29ced5044315dd4fb59a1866964a82..c29d6eb0f4d1324be75a69b0c29aac56b76ed421 100644 --- a/tools/op.cmake +++ b/tools/op.cmake @@ -276,6 +276,10 @@ if(NOT FOUND_MATCH) set(SEQUENCE_EXPAND_OP ON) set(SEQUENCE_POOL_OP ON) set(SEQUENCE_SOFTMAX_OP ON) + set(LOG_OP ON) + set(TANH_OP ON) + set(LOD_RESET_OP ON) + set(LESS_THAN_OP ON) endif() # option(BATCHNORM_OP "" ON) @@ -512,6 +516,15 @@ endif() if (SEQUENCE_SOFTMAX_OP) add_definitions(-DSEQUENCE_SOFTMAX_OP) endif() +if (LOG_OP) + add_definitions(-DLOG_OP) +endif() +if (LOD_RESET_OP) + add_definitions(-DLOD_RESET_OP) +endif() +if (LESS_THAN_OP) + add_definitions(-DLESS_THAN_OP) +endif() if (TANH_OP) add_definitions(-DTANH_OP)