// Copyright (c) 2019 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#include "paddle/fluid/framework/executor_gc_helper.h"

#include <algorithm>
#include <deque>
#include <memory>
#include <string>
#include <unordered_map>
#include <unordered_set>
#include <utility>
#include <vector>

#include "glog/logging.h"
#include "paddle/fluid/framework/block_desc.h"
#include "paddle/fluid/framework/no_need_buffer_vars_inference.h"
#include "paddle/fluid/framework/op_info.h"
#include "paddle/fluid/framework/op_registry.h"
#include "paddle/fluid/framework/operator.h"
#include "paddle/fluid/framework/var_desc.h"
#include "paddle/fluid/operators/controlflow/conditional_block_op_helper.h"
#include "paddle/fluid/operators/controlflow/recurrent_op_helper.h"
#include "paddle/fluid/operators/controlflow/while_op_helper.h"
#include "paddle/fluid/platform/enforce.h"

namespace paddle {
namespace framework {

// Collects, for one op, the argument names whose buffers are actually needed:
// inputs not declared no-need-buffer by the op's inferer, plus all outputs.
void OpInOutInfo::Build(const OperatorBase *op) {
  is_built_ = true;
  auto &inferer = op->Info().NoNeedBufferVarsInferer();
  if (inferer) {
    no_need_buffer_ins_ = inferer(op->Inputs(), op->Outputs(), op->Attrs());

    if (no_need_buffer_ins_.empty()) return;

    for (auto &in_name_pair : op->Inputs()) {
      if (no_need_buffer_ins_.count(in_name_pair.first) != 0) {
        continue;
      }

      for (auto &in_arg_name : in_name_pair.second) {
        other_args_set_.insert(in_arg_name);
      }
    }

    for (auto &out_name_pair : op->Outputs()) {
      for (auto &out_arg_name : out_name_pair.second) {
        other_args_set_.insert(out_arg_name);
      }
    }
  }
}

bool OpInOutInfo::IsInArgBufferNeeded(const std::string &in_arg_name) const {
  return no_need_buffer_ins_.empty() ||
         other_args_set_.count(in_arg_name) != 0;
}

// A variable can be garbage-collected only if it is not in the skip set, not
// persistable, and is a LoDTensor, SelectedRows or LoDTensorArray.
static bool VarCanBeDeleted(const std::string &name, const BlockDesc &block,
                            const std::unordered_set<std::string> &skip_vars) {
  if (skip_vars.count(name) != 0) {
    return false;
  }

  auto *var_desc = block.FindVar(name);
  if (var_desc == nullptr || var_desc->Persistable()) {
    return false;
  }

  auto type = var_desc->Proto()->type().type();

  return type == proto::VarType::LOD_TENSOR ||
         type == proto::VarType::SELECTED_ROWS ||
         type == proto::VarType::LOD_TENSOR_ARRAY;
}

// Maps each op to the variables that can be released right after it runs,
// i.e. the variables whose last reader or writer is that op.
std::unordered_map<const OperatorBase *, std::vector<std::string>>
GetUnusedVars(const BlockDesc &block,
              const std::vector<std::unique_ptr<OperatorBase>> &ops,
              const std::vector<std::string> &skip_var_list) {
  std::unordered_set<std::string> skip_vars(skip_var_list.begin(),
                                            skip_var_list.end());

  std::unordered_map<std::string, size_t> var_op_idx_map;

  for (size_t i = 0; i < ops.size(); ++i) {
    auto *op = ops[i].get();

    OpInOutInfo info;
    for (auto &name_pair : op->Inputs()) {
      for (auto &name : name_pair.second) {
        if (!VarCanBeDeleted(name, block, skip_vars)) {
          continue;
        }

        // var can be gc-ed
        if (!info.IsBuilt()) {
          info.Build(op);
        }

        if (info.IsInArgBufferNeeded(name)) {
          // Update the last living op of variable to current op
          var_op_idx_map[name] = i;
        } else {
          VLOG(10) << "Skip reference count computing of variable "
                   << name_pair.first << "(" << name << ") in Operator "
                   << op->Type();
        }
      }
    }

    for (auto &name_pair : op->Outputs()) {
      for (auto &name : name_pair.second) {
        if (VarCanBeDeleted(name, block, skip_vars)) {
          // Update the last living op of variable to current op
          var_op_idx_map[name] = i;
        }
      }
    }
  }

  std::unordered_map<const OperatorBase *, std::vector<std::string>> result;
  for (auto &name_op_idx_pair : var_op_idx_map) {
    auto &name = name_op_idx_pair.first;
    size_t op_idx = name_op_idx_pair.second;
    result[ops[op_idx].get()].emplace_back(name);
  }
  return result;
}

// Moves the memory holders of the given variables into the garbage collector
// so their buffers can be freed.
void DeleteUnusedTensors(const Scope &scope,
                         const std::vector<std::string> &delete_vars,
                         GarbageCollector *gc) {
  std::deque<std::shared_ptr<memory::Allocation>> garbages;

  for (auto &var_name : delete_vars) {
    auto *var = scope.FindVar(var_name);
    if (var == nullptr) {
      continue;
    }

    VLOG(2) << "Erase variable " << var_name;
    if (var->IsType<LoDTensor>()) {
      garbages.emplace_back(var->GetMutable<LoDTensor>()->MoveMemoryHolder());
    } else if (var->IsType<SelectedRows>()) {
      garbages.emplace_back(var->GetMutable<SelectedRows>()
                                ->mutable_value()
                                ->MoveMemoryHolder());
    } else if (var->IsType<LoDTensorArray>()) {
      auto *lod_tensor_arr = var->GetMutable<LoDTensorArray>();
      for (auto &t : *lod_tensor_arr) {
        garbages.emplace_back(t.MoveMemoryHolder());
      }
    } else if (var->IsType<Strings>()) {
      // Strings hold no tensor allocation, so there is nothing to collect.
    } else {
      PADDLE_THROW(platform::errors::Unimplemented(
          "Type %s of variable %s is not supported eager deletion.",
          framework::ToTypeName(var->Type()), var_name));
    }
  }

  if (!garbages.empty()) {
    gc->Add(std::move(garbages));
  }
}

void DeleteUnusedTensors(
    const Scope &scope, const OperatorBase *op,
    const std::unordered_map<const OperatorBase *, std::vector<std::string>>
        &delete_vars_map,
    GarbageCollector *gc) {
  auto iter = delete_vars_map.find(op);
  if (iter == delete_vars_map.end()) {
    return;
  }

  auto &delete_vars = iter->second;
  DeleteUnusedTensors(scope, delete_vars, gc);
}

static std::vector<std::unique_ptr<OperatorBase>> CreateOpsFromBlock(
    const BlockDesc &block) {
  std::vector<std::unique_ptr<OperatorBase>> ops;
  size_t op_num = block.OpSize();
  ops.reserve(op_num);
  for (size_t i = 0; i < op_num; ++i) {
    auto *op_desc = block.Op(i);
    ops.push_back(OpRegistry::CreateOp(*op_desc));
  }
  return ops;
}

// For every block of the program, computes the variables each op can clean
// eagerly: result[block_id][op_idx] holds the variable names that may be
// deleted right after that op runs.
std::vector<std::vector<std::vector<std::string>>> GetEagerDeletionCleanVars(
    const ProgramDesc &origin_program,
    const std::vector<std::string> &skip_vars) {
  ProgramDesc program{origin_program};
  size_t block_num = program.Size();
  PADDLE_ENFORCE_GE(block_num, 1,
                    platform::errors::PermissionDenied(
                        "Program should have at least one block"));

  // prepare safe GCs on sub block ops
  auto global_block_ops = CreateOpsFromBlock(program.Block(0));
  operators::PrepareSafeEagerDeletionOnConditionalOpAndConditionalGradOp(
      program, 0, global_block_ops);
  operators::PrepareSafeEagerDeletionOnWhileOpAndWhileGradOp(program, 0,
                                                             global_block_ops);
  operators::PrepareSafeEagerDeletionOnRecurrentOpAndRecurrentGradOp(
      program, 0, global_block_ops);

  // find the skip vars on each block
  std::vector<std::vector<std::string>> skip_vars_on_each_block(block_num);
  skip_vars_on_each_block[0] = skip_vars;
  std::vector<bool> found_skip_vars(block_num, false);
  found_skip_vars[0] = true;

  const char *kSubBlock = "sub_block";
  const char *kSkipEagerDeletionVars = "skip_eager_deletion_vars";

  for (size_t i = 0; i < block_num; ++i) {
    const auto &block = program.Block(i);
    size_t op_num = block.OpSize();
    for (size_t j = 0; j < op_num; ++j) {
      auto *op = block.Op(j);
      if (!op->HasAttr(kSubBlock) || !op->HasAttr(kSkipEagerDeletionVars)) {
        continue;
      }
      auto sub_block_id = op->GetAttrIfExists<BlockDesc *>(kSubBlock)->ID();
      PADDLE_ENFORCE_GE(sub_block_id, 0,
                        platform::errors::PermissionDenied(
                            "sub_block id must be non-negative number"));
      PADDLE_ENFORCE_LT(sub_block_id, block_num,
                        platform::errors::PermissionDenied(
                            "sub_block id exceeds max block num"));
      PADDLE_ENFORCE_EQ(
          found_skip_vars[sub_block_id], false,
          platform::errors::PermissionDenied(
              "there are 2 ops which refer to the same sub_block %d",
              sub_block_id));

      found_skip_vars[sub_block_id] = true;
      auto sub_block_skip_vars =
          op->GetAttrIfExists<std::vector<std::string>>(kSkipEagerDeletionVars);
      skip_vars_on_each_block[sub_block_id] = std::move(sub_block_skip_vars);
    }
  }

  std::vector<std::vector<std::vector<std::string>>> result;
  result.reserve(block_num);
  for (size_t i = 0; i < block_num; ++i) {
    const auto &block = program.Block(i);
    const auto block_ops = CreateOpsFromBlock(block);
    const auto &block_skip_vars = skip_vars_on_each_block[i];
    auto delete_var_map = GetUnusedVars(block, block_ops, block_skip_vars);

    std::vector<std::vector<std::string>> block_result;
    block_result.reserve(block_ops.size());
    for (const auto &op : block_ops) {
      auto &delete_vars = delete_var_map[op.get()];
      std::sort(delete_vars.begin(), delete_vars.end());  // for stable result
      block_result.emplace_back(delete_vars);
    }
    result.emplace_back(std::move(block_result));
  }
  return result;
}

}  // namespace framework
}  // namespace paddle