// Copyright (c) 2019 PaddlePaddle Authors. All Rights Reserved. // // Licensed under the Apache License, Version 2.0 (the "License"); // you may not use this file except in compliance with the License. // You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, software // distributed under the License is distributed on an "AS IS" BASIS, // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. // See the License for the specific language governing permissions and // limitations under the License. #include "framework/dag.h" #include #include #include "common/inner_common.h" #include "framework/predictor_metric.h" // PredictorMetric #include "op/op.h" namespace baidu { namespace paddle_serving { namespace predictor { Dag::Dag() { _index_nodes.clear(); _name_nodes.clear(); _stages.clear(); } Dag::~Dag() { deinit(); } int Dag::deinit() { for (std::vector::iterator iter = _stages.begin(); iter != _stages.end(); ++iter) { if (*iter != NULL) { delete *iter; } } _stages.clear(); for (std::vector::iterator iter = _index_nodes.begin(); iter != _index_nodes.end(); ++iter) { DagNode* node = *iter; if (node != NULL) { void* conf = node->conf; if (conf != NULL) { Op* op = OpRepository::instance().get_op(node->type); if (op == NULL) { LOG(ERROR) << "Failed to get_op, op type[" << node->type << "]"; return -1; } op->delete_config(conf); OpRepository::instance().return_op(node->type, op); } delete node; } } _index_nodes.clear(); _name_nodes.clear(); return 0; } EdgeMode Dag::parse_mode(std::string& mode) { if (mode == "RO") { return RO; } else if (mode == "RW") { return RW; } else { return UNKNOWN; } } // [@Node] // name: preprocess // type: ProcessorOp // [.@Depend] // name: StartupOp // mode: RO // [@Node] // name: discret_extractor // type: DiscretExtractOp // [.@Depend] // name: StartupOp // mode: RO // [.@Depend] // name: preprocess // mode: RW // [@Node] // name: dnn_inference // type: PaddleV2InferenceOp // [.@Depend] // name: discret_extractor // mode: RO // [@Node] // name: postprocess // type: PostProcessOp // [.@Depend] // name: dnn_inference // mode: RO #if 0 int Dag::init(const char* path, const char* file, const std::string& name) { comcfg::Configure conf; if (conf.load(path, file) != 0) { LOG(ERROR) << "Failed load conf from" << path << "/" << file << " in dag: " << name; return ERR_INTERNAL_FAILURE; } return init(conf, name); } #endif int Dag::init(const configure::Workflow& conf, const std::string& name) { _dag_name = name; _index_nodes.clear(); _name_nodes.clear(); for (uint32_t i = 0; i < conf.nodes_size(); i++) { DagNode* node = new (std::nothrow) DagNode(); if (node == NULL) { LOG(ERROR) << "Failed create new dag node"; return ERR_MEM_ALLOC_FAILURE; } node->id = i + 1; // 0 is reserved for begginer-op node->name = conf.nodes(i).name(); node->type = conf.nodes(i).type(); uint32_t depend_size = conf.nodes(i).dependencies_size(); for (uint32_t j = 0; j < depend_size; j++) { const configure::DAGNodeDependency& depend = conf.nodes(i).dependencies(j); std::string name = depend.name(); std::string mode = depend.mode(); node->depends.insert(std::make_pair(name, parse_mode(mode))); } Op* op = OpRepository::instance().get_op(node->type); if (op == NULL) { LOG(ERROR) << "Failed to get_op, op type[" << node->type << "]"; return ERR_INTERNAL_FAILURE; } // node->conf could be NULL node->conf = op->create_config(conf.nodes(i)); OpRepository::instance().return_op(node->type, op); _name_nodes.insert(std::make_pair(node->name, node)); _index_nodes.push_back(node); } if (topo_sort() != 0) { LOG(ERROR) << "Topo sort dag[" << _dag_name << "] failed!"; return ERR_INTERNAL_FAILURE; } if (FLAGS_el_log_level == 16) { LOG(INFO) << "DAG: " << _dag_name; LOG(INFO) << ", Op Num: " << _index_nodes.size(); for (uint32_t nid = 0; nid < _index_nodes.size(); nid++) { DagNode* node = _index_nodes[nid]; LOG(INFO) << ", OP-" << node->id << "-" << node->name << "-" << node->type; LOG(INFO) << " depends: " << node->depends.size(); boost::unordered_map::iterator it; for (it = node->depends.begin(); it != node->depends.end(); it++) { LOG(INFO) << " " << it->first << " " << it->second; } } LOG(INFO) << ""; } return ERR_OK; } uint32_t Dag::nodes_size() { return _index_nodes.size(); } const DagNode* Dag::node_by_id(uint32_t id) { return _index_nodes[id]; } const DagNode* Dag::node_by_id(uint32_t id) const { return _index_nodes[id]; } const DagNode* Dag::node_by_name(std::string& name) { return _name_nodes[name]; } const DagNode* Dag::node_by_name(const std::string& name) const { boost::unordered_map::const_iterator it; it = _name_nodes.find(name); if (it == _name_nodes.end()) { LOG(WARNING) << "Not found op by name:" << name; return NULL; } return it->second; } uint32_t Dag::stage_size() { return _stages.size(); } const DagStage* Dag::stage_by_index(uint32_t index) { return _stages[index]; } int Dag::topo_sort() { std::stringstream ss; for (uint32_t nid = 0; nid < _index_nodes.size(); nid++) { DagStage* stage = new (std::nothrow) DagStage(); if (stage == NULL) { LOG(ERROR) << "Invalid stage!"; return ERR_MEM_ALLOC_FAILURE; } stage->nodes.push_back(_index_nodes[nid]); ss.str(""); ss << _stages.size(); stage->name = ss.str(); stage->full_name = full_name() + NAME_DELIMITER + stage->name; _stages.push_back(stage); // assign stage number after stage created _index_nodes[nid]->stage = nid; // assign dag node full name after stage created _index_nodes[nid]->full_name = stage->full_name + NAME_DELIMITER + _index_nodes[nid]->name; } return ERR_OK; } void Dag::regist_metric(const std::string& service_name) { for (int stage_idx = 0; stage_idx < _stages.size(); ++stage_idx) { DagStage* stage = _stages[stage_idx]; PredictorMetric::GetInstance()->regist_latency_metric( STAGE_METRIC_PREFIX + service_name + NAME_DELIMITER + stage->full_name); for (int node_idx = 0; node_idx < stage->nodes.size(); ++node_idx) { DagNode* node = stage->nodes[node_idx]; PredictorMetric::GetInstance()->regist_latency_metric( OP_METRIC_PREFIX + service_name + NAME_DELIMITER + node->full_name); Op* op = OpRepository::instance().get_op(node->type); if (op == NULL) { LOG(ERROR) << "Failed to get_op, op type[" << node->type << "]"; return; } op->set_full_name(service_name + NAME_DELIMITER + node->full_name); op->set_config(node->conf); op->regist_metric(); OpRepository::instance().return_op(node->type, op); } } } } // namespace predictor } // namespace paddle_serving } // namespace baidu