/* Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved. Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance with the License. You may obtain a copy of the License at http://www.apache.org/licenses/LICENSE-2.0 Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the specific language governing permissions and limitations under the License. */ #pragma once #include #include #include #include #include #include #include "paddle/fluid/distributed/auto_parallel/auto_parallel.pb.h" #include "paddle/fluid/distributed/auto_parallel/process_mesh.h" #include "paddle/fluid/distributed/auto_parallel/utils.h" #include "paddle/fluid/platform/enforce.h" namespace paddle { // Forward Declaration namespace framework { class BlockDesc; class OpDesc; class ProgramDesc; class VarDesc; } // namespace framework namespace distributed { namespace auto_parallel { using framework::BlockDesc; using framework::OpDesc; using framework::ProgramDesc; using framework::VarDesc; constexpr const char* kDefault = "default"; class TensorDistAttr { public: TensorDistAttr() = default; explicit TensorDistAttr(const VarDesc& tensor); TensorDistAttr(const TensorDistAttr& tensor); TensorDistAttr& operator=(const TensorDistAttr& dist_attr); void copy_from(const TensorDistAttr& dist_attr); const ProcessMesh& process_mesh() const { return process_mesh_; } void set_process_mesh(const ProcessMesh& process_mesh); const std::vector& dims_mapping() const { return dims_mapping_; } void set_dims_mapping(const std::vector& dims_mapping); void set_default_dims_mapping(const std::vector& tensor_shape); int64_t batch_dim() const { return batch_dim_; } void set_batch_dim(int64_t batch_dim); const std::vector& dynamic_dims() const { return dynamic_dims_; } void set_dynamic_dims(const std::vector& dynamic_dims); void set_default_dynamic_dims(const std::vector& tensor_shape); const std::map& annotated() const { return annotated_; } void set_annotated(const std::map& annotated); bool is_annotated(const std::string& name) const { return annotated_.count(name) == 1 && annotated_.at(name) == true; } void mark_annotated(const std::string& name); void clear_annotated() { annotated_.clear(); } bool verify_process_mesh(const ProcessMesh& process_mesh) const; bool verify_dims_mapping(const std::vector& dims_mapping, const std::vector& tensor_shape) const; bool verify_batch_dim(int64_t dim, const std::vector& tensor_shape) const; bool verify_dynamic_dims(const std::vector& dynamic_dims, const std::vector& tensor_shape) const; bool verify_annotated(const std::map& annotated) const; bool verify(const VarDesc* tensor = nullptr) const; // TensorDistAttr from_string(const std::string& dist_str); std::string to_string() const; void from_proto(const TensorDistAttrProto& proto); TensorDistAttrProto to_proto() const; std::string serialize_to_string(); void parse_from_string(const std::string& data); private: static std::vector fields_; ProcessMesh process_mesh_; std::vector dims_mapping_; int64_t batch_dim_{0}; std::vector dynamic_dims_; std::map annotated_; }; inline std::ostream& operator<<(std::ostream& os, const TensorDistAttr& obj) { os << obj.to_string(); return os; } bool operator==(const TensorDistAttr& lhs, const TensorDistAttr& rhs); inline bool operator!=(const TensorDistAttr& lhs, const TensorDistAttr& rhs) { return !operator==(lhs, rhs); } class OperatorDistAttr { public: OperatorDistAttr() = default; explicit OperatorDistAttr(const OpDesc& op); OperatorDistAttr(const OperatorDistAttr& dist_attr); OperatorDistAttr& operator=(const OperatorDistAttr& dist_attr); void initialize(const OpDesc* op = nullptr); void copy_from(const OperatorDistAttr& dist_attr); const std::map& input_dist_attrs() const { return input_dist_attrs_; } std::map& input_dist_attrs() { return input_dist_attrs_; } void set_input_dist_attrs( const std::map& dist_attrs); const std::map& output_dist_attrs() const { return output_dist_attrs_; } std::map& output_dist_attrs() { return output_dist_attrs_; } void set_output_dist_attrs( const std::map& dist_attrs); const TensorDistAttr& input_dist_attr(const std::string& name) const { return input_dist_attrs_.at(name); } TensorDistAttr& input_dist_attr(const std::string& name) { return input_dist_attrs_.at(name); } void set_input_dist_attr(const std::string& name, const TensorDistAttr& dist_attr); const TensorDistAttr& output_dist_attr(const std::string& name) const { return output_dist_attrs_.at(name); } TensorDistAttr& output_dist_attr(const std::string& name) { return output_dist_attrs_.at(name); } void set_output_dist_attr(const std::string& name, const TensorDistAttr& dist_attr); const ProcessMesh& process_mesh() const { return process_mesh_; } void set_process_mesh(const ProcessMesh& process_mesh); const std::string& op_type() const { return op_type_; } void set_op_type(const std::string& op_type) { op_type_ = op_type; } const std::string& impl_type() const { return impl_type_; } void set_impl_type(const std::string& impl_type) { impl_type_ = impl_type; } int64_t impl_idx() const { return impl_idx_; } void set_impl_idx(const int64_t& impl_idx) { impl_idx_ = impl_idx; } bool is_recompute() const { return is_recompute_; } void set_is_recompute(bool is_recompute) { is_recompute_ = is_recompute; } const std::string& execution_stream() const { return execution_stream_; } void set_execution_stream(const std::string& execution_stream) { execution_stream_ = execution_stream; } int64_t scheduling_priority() const { return scheduling_priority_; } void set_scheduling_priority(int64_t scheduling_priority) { scheduling_priority_ = scheduling_priority; } const std::map& annotated() const { return annotated_; } void set_annotated(const std::map& annotated); bool is_annotated(const std::string& name) const { return annotated_.count(name) == 1 && annotated_.at(name) == true; } void mark_annotated(const std::string& name); void clear_annotated(); const std::vector& input_dims_mapping(const std::string& name) const; void set_input_dims_mapping(const std::string& name, const std::vector& dims_mapping); const std::vector& output_dims_mapping(const std::string& name); void set_output_dims_mapping(const std::string& name, const std::vector& dims_mapping); bool verify_input_dist_attr(const std::string& name, const TensorDistAttr& dist_attr, const VarDesc* tensor) const; bool verify_output_dist_attr(const std::string& name, const TensorDistAttr& dist_attr, const VarDesc* tensor) const; bool verify_process_mesh(const ProcessMesh& process_mesh) const; bool verify_annotated(const std::map& annotated) const; bool verify(const OpDesc* op = nullptr) const; void rename_input(const std::string& old_name, const std::string& new_name); void rename_output(const std::string& old_name, const std::string& new_name); // OperatorDistAttr from_string(const std::string& dist_str); std::string to_string() const; void from_proto(const OperatorDistAttrProto& proto); OperatorDistAttrProto to_proto() const; std::string serialize_to_string(); void parse_from_string(const std::string& data); private: static std::vector fields_; std::map input_dist_attrs_; std::map output_dist_attrs_; ProcessMesh process_mesh_; std::string op_type_; std::string impl_type_ = kDefault; int64_t impl_idx_ = 0; bool is_recompute_ = false; std::string execution_stream_ = kDefault; int64_t scheduling_priority_ = 0; // lower value, higher priority std::map annotated_; }; inline std::ostream& operator<<(std::ostream& os, const OperatorDistAttr& obj) { os << obj.to_string(); return os; } bool operator==(const OperatorDistAttr& lhs, const OperatorDistAttr& rhs); inline bool operator!=(const OperatorDistAttr& lhs, const OperatorDistAttr& rhs) { return !operator==(lhs, rhs); } } // namespace auto_parallel } // namespace distributed } // namespace paddle