/* Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved. Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance with the License. You may obtain a copy of the License at http://www.apache.org/licenses/LICENSE-2.0 Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the specific language governing permissions and limitations under the License. */ #pragma once #include #include #include #include #include #include "paddle/phi/api/ext/dll_decl.h" #include "paddle/phi/api/ext/exception.h" #include "paddle/phi/api/include/tensor.h" #include "paddle/utils/any.h" /** * Op Meta Info Related Define. * * Used to maintain operator core information. * */ namespace paddle { namespace framework { class PADDLE_API OpMetaInfoHelper; } // namespace framework using Tensor = paddle::experimental::Tensor; ///////////////// Util Marco Define //////////////// #define PD_DISABLE_COPY_AND_ASSIGN(classname) \ private: \ classname(const classname&) = delete; \ classname(classname&&) = delete; \ classname& operator=(const classname&) = delete; \ classname& operator=(classname&&) = delete #define STATIC_ASSERT_GLOBAL_NAMESPACE(uniq_name, msg) \ struct __test_global_namespace_##uniq_name##__ {}; \ static_assert(std::is_same<::__test_global_namespace_##uniq_name##__, \ __test_global_namespace_##uniq_name##__>::value, \ msg) ///////////////// Util Define and Function //////////////// constexpr char kGradTensorSuffix[] = "@GRAD"; constexpr char kTensorVectorSuffix[] = "@VECTOR"; // Used for Construct Grad Tensor name inline std::string Grad(const std::string& t_name) { std::string result; result.reserve(t_name.size() + 5U); result += t_name; result += kGradTensorSuffix; return result; } // Used for Construct std::vector name inline std::string Vec(const std::string& t_name) { std::string result; result.reserve(t_name.size() + 7U); result += t_name; result += kTensorVectorSuffix; return result; } PADDLE_API void AssignTensorImpl(const Tensor& src, Tensor* dst); ////////////////////// Kernel Context //////////////////////// class PADDLE_API CustomOpKernelContext { public: CustomOpKernelContext() = default; void EmplaceBackInput(Tensor&& input); void EmplaceBackInputs(std::vector&& inputs); void EmplaceBackOutput(Tensor&& output); void EmplaceBackOutputs(std::vector&& outputs); void EmplaceBackAttr(paddle::any attr); const std::pair& InputRangeAt(size_t idx) const; const std::pair& OutputRangeAt(size_t idx) const; const Tensor& InputAt(size_t idx) const; std::vector InputsBetween(size_t start, size_t end) const; Tensor* MutableOutputAt(size_t idx); std::vector MutableOutputBetweeen(size_t start, size_t end); std::vector* AllMutableOutput(); template AttrType AttrAt(size_t idx) const { try { return paddle::any_cast(attrs_.at(idx)); } catch (paddle::bad_any_cast&) { PD_THROW("Attribute cast error in Custom Op Kernel Context."); } } private: // TODO(chenweihang): replaced be SmallVector std::vector inputs_; std::vector outputs_; std::vector attrs_; std::vector> input_range_; std::vector> output_range_; }; ////////////////////// Kernel Function (PD_KERNEL) //////////////////////// // Record Op kernel core function using KernelFunc = void (*)(CustomOpKernelContext*); #define PD_SPECIALIZE_ComputeCallHelper(attr_type) \ template \ struct ComputeCallHelper { \ template \ static void Compute(CustomOpKernelContext* ctx, \ const PreviousArgs&... pargs) { \ attr_type arg = ctx->AttrAt(attr_idx); \ ComputeCallHelper< \ Tail...>::template Compute(ctx, \ pargs..., \ arg); \ } \ } template struct TypeTag {}; template struct KernelFuncImpl; template struct KernelFuncImpl { static void Compute(CustomOpKernelContext* ctx) { ComputeCallHelper>::template Compute<0, 0, 0>(ctx); } private: template struct ComputeCallHelper; template struct ComputeCallHelper { template static void Compute(CustomOpKernelContext* ctx, const PreviousArgs&... pargs) { auto& range = ctx->InputRangeAt(in_idx); auto& arg = ctx->InputAt(range.first); ComputeCallHelper< Tail...>::template Compute(ctx, pargs..., arg); } }; template struct ComputeCallHelper&, Tail...> { template static void Compute(CustomOpKernelContext* ctx, const PreviousArgs&... pargs) { auto& range = ctx->InputRangeAt(in_idx); auto arg = ctx->InputsBetween(range.first, range.second); ComputeCallHelper< Tail...>::template Compute(ctx, pargs..., arg); } }; PD_SPECIALIZE_ComputeCallHelper(bool); PD_SPECIALIZE_ComputeCallHelper(int); PD_SPECIALIZE_ComputeCallHelper(float); PD_SPECIALIZE_ComputeCallHelper(int64_t); PD_SPECIALIZE_ComputeCallHelper(const std::string&); PD_SPECIALIZE_ComputeCallHelper(const std::vector&); PD_SPECIALIZE_ComputeCallHelper(const std::vector&); PD_SPECIALIZE_ComputeCallHelper(const std::vector&); PD_SPECIALIZE_ComputeCallHelper(const std::vector&); // TODO(chenweihang): support other attribute type if needed. // Why not support other attribute type here? // - boost::blank, std::vector and std::vector // are not used in op // - BlockDesc* and std::vector are used in framework // NOTE(chenweihang): Used to be compatible with the 2.0.1 released // interface, and will be deprecated in the future PD_SPECIALIZE_ComputeCallHelper(const bool&); PD_SPECIALIZE_ComputeCallHelper(const int&); PD_SPECIALIZE_ComputeCallHelper(const float&); PD_SPECIALIZE_ComputeCallHelper(const int64_t&); // NOTE(chenweihang): Used to be compatible with the 2.1 released // interface, but not recommended PD_SPECIALIZE_ComputeCallHelper(std::string); PD_SPECIALIZE_ComputeCallHelper(std::vector); PD_SPECIALIZE_ComputeCallHelper(std::vector); PD_SPECIALIZE_ComputeCallHelper(std::vector); PD_SPECIALIZE_ComputeCallHelper(std::vector); template struct ComputeCallHelper { template static void Compute(CustomOpKernelContext* ctx, const PreviousArgs&... pargs) { auto& range = ctx->OutputRangeAt(out_idx); auto* arg = ctx->MutableOutputAt(range.first); ComputeCallHelper< Tail...>::template Compute(ctx, pargs..., arg); } }; // TODO(chenweihang): What is the appropriate output form? // std::vector*? or std::vector? or std::vector* template struct ComputeCallHelper, Tail...> { template static void Compute(CustomOpKernelContext* ctx, const PreviousArgs&... pargs) { auto& range = ctx->OutputRangeAt(out_idx); auto arg = ctx->MutableOutputBetweeen(range.first, range.second); ComputeCallHelper< Tail...>::template Compute(ctx, pargs..., arg); } }; template struct ComputeReturnHelper; // For compatibility with the original custom op form template struct ComputeReturnHelper> { static void Compute(CustomOpKernelContext* ctx, const Args&... args) { static_assert(out_idx == 0, "If return std::vector in Custom OpKernel, " "you cannot pass output by kernel funciton argument."); auto outs = impl_fn(args...); auto* orig_outs = ctx->AllMutableOutput(); PD_CHECK(orig_outs->size() == outs.size(), "The number of element in custom operator outputs is wrong, " "expected contains ", orig_outs->size(), " Tensors, but actually contains ", outs.size(), " Tensors."); for (size_t i = 0; i < outs.size(); ++i) { AssignTensorImpl(outs.at(i), &(orig_outs->at(i))); } } }; template struct ComputeReturnHelper { static void Compute(CustomOpKernelContext* ctx, const Args&... args) { static_assert(out_idx > 0, "Custom OpKernel has no output."); impl_fn(args...); } }; // end: base template template struct ComputeCallHelper> { template static void Compute(CustomOpKernelContext* ctx, const PreviousArgs&... pargs) { ComputeReturnHelper::Compute(ctx, pargs...); } }; }; #define PD_KERNEL(...) \ ::paddle::KernelFuncImpl::Compute /////////////// InferShape Function (PD_INFER_SHAPE) /////////////// // Record Op infershape core function using InferShapeFunc = std::vector> (*)( const std::vector>& input_shapes, const std::vector>>& vec_input_shapes, const std::vector& attrs); #define PD_SPECIALIZE_InferShapeCallHelper_FOR_SHAPE(input_type) \ template \ struct InferShapeCallHelper { \ template \ static Return InferShape( \ const std::vector>& input_shapes, \ const std::vector>>& \ vec_input_shapes, \ const std::vector& attrs, \ const PreviousArgs&... pargs) { \ input_type arg = input_shapes[in_idx]; \ return InferShapeCallHelper::template InferShape( \ input_shapes, vec_input_shapes, attrs, pargs..., arg); \ } \ } #define PD_SPECIALIZE_InferShapeCallHelper_FOR_SHAPES(input_type) \ template \ struct InferShapeCallHelper { \ template \ static Return InferShape( \ const std::vector>& input_shapes, \ const std::vector>>& \ vec_input_shapes, \ const std::vector& attrs, \ const PreviousArgs&... pargs) { \ input_type arg = vec_input_shapes[vec_in_idx]; \ return InferShapeCallHelper:: \ template InferShape( \ input_shapes, vec_input_shapes, attrs, pargs..., arg); \ } \ } #define PD_SPECIALIZE_InferShapeCallHelper_FOR_ATTR(attr_type) \ template \ struct InferShapeCallHelper { \ template \ static Return InferShape( \ const std::vector>& input_shapes, \ const std::vector>>& \ vec_input_shapes, \ const std::vector& attrs, \ const PreviousArgs&... pargs) { \ try { \ attr_type arg = paddle::any_cast(attrs[attr_idx]); \ return InferShapeCallHelper:: \ template InferShape( \ input_shapes, vec_input_shapes, attrs, pargs..., arg); \ } catch (paddle::bad_any_cast&) { \ PD_THROW( \ "Attribute cast error in custom operator InferShapeFn. " \ "Expected " #attr_type \ " value. InferShapeFn's attribute list must be exactly same as " \ "Forward " \ "KernelFn's attribute list except std::vector " \ "attribute."); \ } \ } \ } template struct InferShapeFuncImpl; template struct InferShapeFuncImpl { static Return InferShape( const std::vector>& input_shapes, const std::vector>>& vec_input_shapes, const std::vector& attrs) { return InferShapeCallHelper>::template InferShape<0, 0, 0>( input_shapes, vec_input_shapes, attrs); } private: template struct InferShapeCallHelper; PD_SPECIALIZE_InferShapeCallHelper_FOR_SHAPE(const std::vector&); PD_SPECIALIZE_InferShapeCallHelper_FOR_SHAPES( const std::vector>&); // NOTE(chenweihang): Used to be compatible with the 2.0.1 released // interface, and will be deprecated in the future PD_SPECIALIZE_InferShapeCallHelper_FOR_SHAPE(std::vector); PD_SPECIALIZE_InferShapeCallHelper_FOR_SHAPES( std::vector>); PD_SPECIALIZE_InferShapeCallHelper_FOR_ATTR(bool); PD_SPECIALIZE_InferShapeCallHelper_FOR_ATTR(int); PD_SPECIALIZE_InferShapeCallHelper_FOR_ATTR(float); PD_SPECIALIZE_InferShapeCallHelper_FOR_ATTR(int64_t); PD_SPECIALIZE_InferShapeCallHelper_FOR_ATTR(const std::string&); PD_SPECIALIZE_InferShapeCallHelper_FOR_ATTR(const std::vector&); PD_SPECIALIZE_InferShapeCallHelper_FOR_ATTR(const std::vector&); PD_SPECIALIZE_InferShapeCallHelper_FOR_ATTR(const std::vector&); // NOTE(chenweihang): InferShape can't support std::vector attr type, // because the input type is std::vector, only can use one rule to // parse std::vector parameter // NOTE(chenweihang): Used to be compatible with the 2.0.1 released // interface, and will be deprecated in the future PD_SPECIALIZE_InferShapeCallHelper_FOR_ATTR(const bool&); PD_SPECIALIZE_InferShapeCallHelper_FOR_ATTR(const int&); PD_SPECIALIZE_InferShapeCallHelper_FOR_ATTR(const float&); PD_SPECIALIZE_InferShapeCallHelper_FOR_ATTR(const int64_t&); // NOTE(chenweihang): Used to be compatible with the 2.1 released // interface, but not recommended PD_SPECIALIZE_InferShapeCallHelper_FOR_ATTR(std::string); PD_SPECIALIZE_InferShapeCallHelper_FOR_ATTR(std::vector); PD_SPECIALIZE_InferShapeCallHelper_FOR_ATTR(std::vector); PD_SPECIALIZE_InferShapeCallHelper_FOR_ATTR(std::vector); // end: base template template struct InferShapeCallHelper> { template static Return InferShape( const std::vector>& input_shapes, const std::vector>>& vec_input_shapes, const std::vector& attrs, const Args&... args) { return impl_fn(args...); } }; }; #define PD_INFER_SHAPE(...) \ ::paddle::InferShapeFuncImpl::InferShape /////////////// InferDataType Function (PD_INFER_DTYPE) /////////////// // Record Op Infer dtype core function using InferDtypeFunc = std::vector (*)( const std::vector& input_dtypes, const std::vector>& vec_input_dtypes); #define PD_SPECIALIZE_InferDtypeCallHelper_TO_DTYPE(input_type) \ template \ struct InferDtypeCallHelper { \ template \ static Return InferDtype( \ const std::vector& input_dtypes, \ const std::vector>& vec_input_dtypes, \ const PreviousArgs&... pargs) { \ input_type arg = input_dtypes[in_idx]; \ return InferDtypeCallHelper::template InferDtype( \ input_dtypes, vec_input_dtypes, pargs..., arg); \ } \ } #define PD_SPECIALIZE_InferDtypeCallHelper_FOR_DTYPES(input_type) \ template \ struct InferDtypeCallHelper { \ template \ static Return InferDtype( \ const std::vector& input_dtypes, \ const std::vector>& vec_input_dtypes, \ const PreviousArgs&... pargs) { \ input_type arg = vec_input_dtypes[vec_in_idx]; \ return InferDtypeCallHelper::template InferDtype( \ input_dtypes, vec_input_dtypes, pargs..., arg); \ } \ } template struct InferDtypeFuncImpl; template struct InferDtypeFuncImpl { static Return InferDtype( const std::vector& input_dtypes, const std::vector>& vec_input_dtypes) { return InferDtypeCallHelper>::template InferDtype<0, 0>( input_dtypes, vec_input_dtypes); } private: template struct InferDtypeCallHelper; PD_SPECIALIZE_InferDtypeCallHelper_TO_DTYPE(const DataType&); PD_SPECIALIZE_InferDtypeCallHelper_FOR_DTYPES(const std::vector&); // NOTE(chenweihang): Used to be compatible with the 2.0.1 released // interface, and will be deprecated in the future PD_SPECIALIZE_InferDtypeCallHelper_TO_DTYPE(DataType); PD_SPECIALIZE_InferDtypeCallHelper_FOR_DTYPES(std::vector); // end: base template template struct InferDtypeCallHelper> { template static Return InferDtype( const std::vector& input_dtypes, const std::vector>& vec_input_dtypes, const Args&... args) { return impl_fn(args...); } }; }; #define PD_INFER_DTYPE(...) \ ::paddle::InferDtypeFuncImpl::InferDtype ////////////////////// Op Meta Info ////////////////////// class PADDLE_API OpMetaInfo { public: explicit OpMetaInfo(const std::string& op_name) : name_(op_name) {} // format: {"", "", ...} OpMetaInfo& Inputs(std::vector&& inputs); // format: {"", "", ...} OpMetaInfo& Outputs(std::vector&& outputs); // format: {":", ":", ...} OpMetaInfo& Attrs(std::vector&& attrs); // format: PD_KERNEL(...) OpMetaInfo& SetKernelFn(KernelFunc&& func); // format: PD_INFER_SHAPE(...) OpMetaInfo& SetInferShapeFn(InferShapeFunc&& func); // format: PD_INFER_DTYPE(...) OpMetaInfo& SetInferDtypeFn(InferDtypeFunc&& func); private: friend class framework::OpMetaInfoHelper; // 1. desc info std::string name_; std::vector inputs_; std::vector outputs_; std::vector attrs_; // 2. func info KernelFunc kernel_fn_{nullptr}; InferShapeFunc infer_shape_fn_{nullptr}; InferDtypeFunc infer_dtype_fn_{nullptr}; }; //////////////// Op Meta Info Map ///////////////// class PADDLE_API OpMetaInfoMap { public: // this function's impl should keep in header file. // if move to cc file, meta info can not be added // into map static OpMetaInfoMap& Instance() { static OpMetaInfoMap g_custom_op_meta_info_map; return g_custom_op_meta_info_map; } std::vector& operator[](const std::string& name); const std::unordered_map>& GetMap() const; private: OpMetaInfoMap() = default; std::unordered_map> map_; PD_DISABLE_COPY_AND_ASSIGN(OpMetaInfoMap); }; //////////////// Op Meta Info Builder ///////////////// class PADDLE_API OpMetaInfoBuilder { public: explicit OpMetaInfoBuilder(std::string&& name, size_t index); OpMetaInfoBuilder& Inputs(std::vector&& inputs); OpMetaInfoBuilder& Outputs(std::vector&& outputs); OpMetaInfoBuilder& Attrs(std::vector&& attrs); OpMetaInfoBuilder& SetKernelFn(KernelFunc func); OpMetaInfoBuilder& SetInferShapeFn(InferShapeFunc func); OpMetaInfoBuilder& SetInferDtypeFn(InferDtypeFunc func); private: // Forward Op name std::string name_; // ref current info ptr OpMetaInfo* info_ptr_; // The current op meta info index in vector // - 0: op, 1: grad_op, 2: grad_grad_op size_t index_; }; /////////////////////// Op register API ///////////////////////// // For inference: compile directly with framework // Call after PD_BUILD_OP(...) void RegisterAllCustomOperator(); // Using this api to load compiled custom operator's dynamic library and // register Custom // Operator into it void LoadCustomOperatorLib(const std::string& dso_name); /////////////////////// Op register Macro ///////////////////////// #define PD_BUILD_OP(op_name) \ STATIC_ASSERT_GLOBAL_NAMESPACE( \ __reg_op__##op_name, "PD_BUILD_OP must be called in global namespace."); \ static ::paddle::OpMetaInfoBuilder __op_meta_info_##op_name##__ = \ ::paddle::OpMetaInfoBuilder(#op_name, 0) #define PD_BUILD_GRAD_OP(op_name) \ STATIC_ASSERT_GLOBAL_NAMESPACE( \ __reg_grad_op__##op_name, \ "PD_BUILD_GRAD_OP must be called in global namespace."); \ static ::paddle::OpMetaInfoBuilder __grad_op_meta_info_##op_name##__ = \ ::paddle::OpMetaInfoBuilder(#op_name, 1) #define PD_BUILD_DOUBLE_GRAD_OP(op_name) \ STATIC_ASSERT_GLOBAL_NAMESPACE( \ __reg_grad_grad_op__##op_name, \ "PD_BUILD_DOUBLE_GRAD_OP must be called in global namespace."); \ static ::paddle::OpMetaInfoBuilder __grad_grad_op_meta_info_##op_name##__ = \ ::paddle::OpMetaInfoBuilder(#op_name, 2) } // namespace paddle ///////////////////// C API /////////////////// #ifdef __cplusplus extern "C" { #endif #if defined(_WIN32) // C-API to get global OpMetaInfoMap. __declspec(dllexport) inline paddle::OpMetaInfoMap& PD_GetOpMetaInfoMap() { return paddle::OpMetaInfoMap::Instance(); } #endif // _WIN32 #ifdef __cplusplus } #endif