diff --git a/paddle/fluid/distributed/ps/service/brpc_ps_server.cc b/paddle/fluid/distributed/ps/service/brpc_ps_server.cc index 58ce52552c9d22c56b314dfe0bccbb8a564edb5d..747b0cbb325d0d6c27808a73e8af1386f557fd04 100644 --- a/paddle/fluid/distributed/ps/service/brpc_ps_server.cc +++ b/paddle/fluid/distributed/ps/service/brpc_ps_server.cc @@ -188,7 +188,8 @@ void BrpcPsService::service(google::protobuf::RpcController *cntl_base, int32_t BrpcPsService::pull_dense(Table *table, const PsRequestMessage &request, PsResponseMessage &response, brpc::Controller *cntl) { - platform::RecordEvent record_event("PsService->pull_dense"); + platform::RecordEvent record_event( + "PsService->pull_dense", platform::TracerEventType::Communication, 1); CHECK_TABLE_EXIST(table, request, response) if (request.params_size() < 1) { set_response_code( @@ -219,7 +220,9 @@ int32_t BrpcPsService::push_dense_param(Table *table, const PsRequestMessage &request, PsResponseMessage &response, brpc::Controller *cntl) { - platform::RecordEvent record_event("PsService->push_dense_param"); + platform::RecordEvent record_event("PsService->push_dense_param", + platform::TracerEventType::Communication, + 1); CHECK_TABLE_EXIST(table, request, response) thread_local std::string push_buffer; auto &req_io_buffer = cntl->request_attachment(); @@ -245,7 +248,8 @@ int32_t BrpcPsService::push_dense_param(Table *table, int32_t BrpcPsService::push_dense(Table *table, const PsRequestMessage &request, PsResponseMessage &response, brpc::Controller *cntl) { - platform::RecordEvent record_event("PsService->push_dense"); + platform::RecordEvent record_event( + "PsService->push_dense", platform::TracerEventType::Communication, 1); CHECK_TABLE_EXIST(table, request, response) auto req_buffer_size = request.data().size(); if (req_buffer_size < 1) { @@ -291,7 +295,9 @@ int32_t BrpcPsService::push_sparse_param(Table *table, const PsRequestMessage &request, PsResponseMessage &response, brpc::Controller *cntl) { - platform::RecordEvent record_event("PsService->push_sparse_param"); + platform::RecordEvent record_event("PsService->push_sparse_param", + platform::TracerEventType::Communication, + 1); CHECK_TABLE_EXIST(table, request, response) auto &push_data = request.data(); if (push_data.size() < 1) { @@ -323,7 +329,8 @@ int32_t BrpcPsService::pull_geo_param(Table *table, const PsRequestMessage &request, PsResponseMessage &response, brpc::Controller *cntl) { - platform::RecordEvent record_event("PsService->pull_geo_param"); + platform::RecordEvent record_event( + "PsService->pull_geo_param", platform::TracerEventType::Communication, 1); CHECK_TABLE_EXIST(table, request, response) thread_local std::string push_sparse_request_buffer; @@ -346,7 +353,8 @@ int32_t BrpcPsService::pull_sparse(Table *table, const PsRequestMessage &request, PsResponseMessage &response, brpc::Controller *cntl) { - platform::RecordEvent record_event("PsService->pull_sparse"); + platform::RecordEvent record_event( + "PsService->pull_sparse", platform::TracerEventType::Communication, 1); CHECK_TABLE_EXIST(table, request, response) auto &req_io_buffer = cntl->request_attachment(); @@ -392,7 +400,8 @@ int32_t BrpcPsService::push_sparse(Table *table, const PsRequestMessage &request, PsResponseMessage &response, brpc::Controller *cntl) { - platform::RecordEvent record_event("PsService->push_sparse"); + platform::RecordEvent record_event( + "PsService->push_sparse", platform::TracerEventType::Communication, 1); CHECK_TABLE_EXIST(table, request, response) auto &push_data = request.data(); if (push_data.size() < 1) { diff --git a/paddle/fluid/distributed/ps/service/communicator/communicator.cc b/paddle/fluid/distributed/ps/service/communicator/communicator.cc index f47415812e51d5cb6fc79a814e3d88ae0f109d66..6dbe8ba3a0b909aad11f49ce748a3ac8ffc37965 100644 --- a/paddle/fluid/distributed/ps/service/communicator/communicator.cc +++ b/paddle/fluid/distributed/ps/service/communicator/communicator.cc @@ -113,7 +113,9 @@ int Communicator::SetClients(std::vector &host_sign_list) { void Communicator::RpcRecvDense(const std::vector &varnames, int table_id, Scope *scope) { - platform::RecordEvent record_event("Communicator->RpcRecvDense"); + platform::RecordEvent record_event("Communicator->RpcRecvDense", + platform::TracerEventType::Communication, + 1); std::vector regions; regions.reserve(varnames.size()); for (auto &t : varnames) { @@ -169,7 +171,9 @@ void Communicator::RpcRecvDense(const std::vector &varnames, void Communicator::RpcSendDenseParam(const std::vector &varnames, int table_id, const Scope &scope) { - platform::RecordEvent record_event("Communicator->RpcSendDenseParam"); + platform::RecordEvent record_event("Communicator->RpcSendDenseParam", + platform::TracerEventType::Communication, + 1); auto place = platform::CPUPlace(); std::vector regions; for (auto &t : varnames) { @@ -206,7 +210,9 @@ void Communicator::RpcSendDenseParam(const std::vector &varnames, } void Communicator::RpcSendDense(const CommContext &ctx, const Scope &scope) { - platform::RecordEvent record_event("Communicator->RpcSendDense"); + platform::RecordEvent record_event("Communicator->RpcSendDense", + platform::TracerEventType::Communication, + 1); auto &var_names = ctx.origin_varnames; auto &table_id = ctx.table_id; auto dense_data = std::make_shared>(); @@ -250,7 +256,9 @@ void Communicator::RpcSendDense(const CommContext &ctx, const Scope &scope) { void Communicator::RpcSendSparseParam(const std::string &varname, int table_id, const Scope &scope) { - platform::RecordEvent record_event("Communicator->RpcSendSparseParam"); + platform::RecordEvent record_event("Communicator->RpcSendSparseParam", + platform::TracerEventType::Communication, + 1); size_t request_call_num = _worker_ptr->get_server_nums(); std::vector push_g_vec; @@ -287,7 +295,9 @@ void Communicator::RpcSendSparseParam(const std::string &varname, int table_id, void Communicator::RpcSendSparse(const std::string &var_name, int table_id, const Scope &scope) { - platform::RecordEvent record_event("Communicator->RpcSendSparse"); + platform::RecordEvent record_event("Communicator->RpcSendSparse", + platform::TracerEventType::Communication, + 1); size_t request_call_num = _worker_ptr->get_server_nums(); std::vector sparse_push_keys; std::vector push_g_vec; @@ -338,7 +348,9 @@ void Communicator::RpcSendSparse(const std::string &var_name, int table_id, void Communicator::RpcRecvSparse(const std::string &varname, int table_id, Scope *scope) { - platform::RecordEvent record_event("Communicator->RpcRecvSparse"); + platform::RecordEvent record_event("Communicator->RpcRecvSparse", + platform::TracerEventType::Communication, + 1); auto *send_var = scope->Var(varname); auto *tensor = send_var->GetMutable(); auto dim = tensor->dims()[1]; @@ -406,7 +418,9 @@ void Communicator::SendGlobalStep(const CommContext &ctx, int batches, if (batches == 0) { return; } - platform::RecordEvent record_event("Communicator->SendGlobalStep"); + platform::RecordEvent record_event("Communicator->SendGlobalStep", + platform::TracerEventType::Communication, + 1); auto &table_id = ctx.table_id; size_t request_call_num = _worker_ptr->get_server_nums(); @@ -994,7 +1008,8 @@ void SyncCommunicator::BarrierRecv() { void GeoCommunicator::Send(const std::vector &var_names, const framework::Scope &scope) { - platform::RecordEvent record_event("GeoCommunicator->Send"); + platform::RecordEvent record_event( + "GeoCommunicator->Send", platform::TracerEventType::Communication, 1); waiting_ = false; auto before_send = GetCurrentUS(); auto table_name = var_names[0]; @@ -1137,7 +1152,9 @@ void GeoCommunicator::InitDense(std::vector &varnames, } void GeoCommunicator::SendDense(const CommContext &send_ctx) { - platform::RecordEvent record_event("GeoCommunicator->SendDense"); + platform::RecordEvent record_event("GeoCommunicator->SendDense", + platform::TracerEventType::Communication, + 1); auto &var_names = send_ctx.origin_varnames; auto &table_id = send_ctx.table_id; for (auto &varname : var_names) { @@ -1177,7 +1194,9 @@ void GeoCommunicator::SendDense(const CommContext &send_ctx) { } void GeoCommunicator::RecvDense(const CommContext &send_ctx) { - platform::RecordEvent record_event("GeoCommunicator->RecvDense"); + platform::RecordEvent record_event("GeoCommunicator->RecvDense", + platform::TracerEventType::Communication, + 1); auto &table_id = send_ctx.table_id; auto &varnames = recv_varname_to_ctx_.at(table_id); // 1. recv from pserver @@ -1235,7 +1254,9 @@ void GeoCommunicator::InitSparse(const std::string &var_name, int table_id) { std::vector GeoCommunicator::MergeSparseIds( const std::string &send_varname) { - platform::RecordEvent record_event("GeoCommunicator->MergeSparseIds"); + platform::RecordEvent record_event("GeoCommunicator->MergeSparseIds", + platform::TracerEventType::Communication, + 1); size_t merge_num = 0, wait_times = 0; std::unordered_set sparse_ids; while (merge_num < static_cast(max_merge_var_num_)) { @@ -1267,7 +1288,9 @@ std::vector GeoCommunicator::MergeSparseIds( void GeoCommunicator::SendSparse(const std::string &varname, std::vector &sparse_ids, int table_id, int ep_idx) { - platform::RecordEvent record_event("GeoCommunicator->SendSparse"); + platform::RecordEvent record_event("GeoCommunicator->SendSparse", + platform::TracerEventType::Communication, + 1); if (sparse_ids.size() == 0) { return; } @@ -1342,7 +1365,9 @@ void GeoCommunicator::SendSparse(const std::string &varname, void GeoCommunicator::RecvSparse(const std::string &varname, int table_id, int ep_idx) { - platform::RecordEvent record_event("GeoCommunicator->RecvSparse"); + platform::RecordEvent record_event("GeoCommunicator->RecvSparse", + platform::TracerEventType::Communication, + 1); // 1. recv from pserver std::vector keys; std::vector values; diff --git a/paddle/fluid/distributed/ps/service/heter_client.cc b/paddle/fluid/distributed/ps/service/heter_client.cc index 8aebae237360e108cac26c828bde64efa65e7882..d6287cda6d4438106b36f9b9f9ff1e93b3f140da 100644 --- a/paddle/fluid/distributed/ps/service/heter_client.cc +++ b/paddle/fluid/distributed/ps/service/heter_client.cc @@ -13,7 +13,6 @@ // limitations under the License. #include "paddle/fluid/distributed/ps/service/heter_client.h" - #include "paddle/fluid/framework/convert_utils.h" #include "paddle/fluid/platform/profiler.h" #include "paddle/fluid/string/split.h" @@ -152,7 +151,9 @@ void HeterClient::SendAndRecvAsync( const std::string& message_name, const std::vector& send_var_name, const std::vector& recv_var_name, const std::string& mode) { - platform::RecordEvent record_event("HeterClient->SendAndRecvAsync"); + platform::RecordEvent record_event("HeterClient->SendAndRecvAsync", + platform::TracerEventType::Communication, + 1); const platform::DeviceContext* p_ctx = &ctx; const framework::Scope* p_scope = &scope; const std::string message_name_val = message_name; diff --git a/paddle/fluid/distributed/ps/service/heter_server.h b/paddle/fluid/distributed/ps/service/heter_server.h index 86f83cb1fc4fe5ef881dbb2e8f88bd6d1bc67bc5..a14fb5f6cc04a58cab53b10a4f17cf3caaa402ed 100644 --- a/paddle/fluid/distributed/ps/service/heter_server.h +++ b/paddle/fluid/distributed/ps/service/heter_server.h @@ -213,7 +213,9 @@ class RequestSendAndRecvHandler final : public HeterRequestHandler { int Handle(const MultiVarMsg* request, MultiVarMsg* response, brpc::Controller* cntl) override { - platform::RecordEvent record_event("RequestSendAndRecvHandler->Handle"); + platform::RecordEvent record_event("RequestSendAndRecvHandler->Handle", + platform::TracerEventType::Communication, + 1); FLAGS_eager_delete_tensor_gb = -1; // get microID from request diff --git a/paddle/fluid/distributed/ps/service/ps_service/graph_py_service.cc b/paddle/fluid/distributed/ps/service/ps_service/graph_py_service.cc index b2aece98071c146b23e897900b9c7f9736c2f2de..088edcb75bbc67d6d2acef9609b442f6fa38c332 100644 --- a/paddle/fluid/distributed/ps/service/ps_service/graph_py_service.cc +++ b/paddle/fluid/distributed/ps/service/ps_service/graph_py_service.cc @@ -18,7 +18,7 @@ #include "iomanip" #include "paddle/fluid/distributed/ps/table/table.h" #include "paddle/fluid/framework/archive.h" -#include "paddle/fluid/platform/profiler.h" +#include "paddle/fluid/platform/profiler/event_tracing.h" namespace paddle { namespace distributed { std::vector GraphPyService::split(std::string& str, diff --git a/paddle/fluid/framework/details/all_reduce_op_handle.cc b/paddle/fluid/framework/details/all_reduce_op_handle.cc index 1facbe850ee5237f16ad92f140232f1394b2c4bf..50c544b39c163488458aeb9226bb10a381d89360 100644 --- a/paddle/fluid/framework/details/all_reduce_op_handle.cc +++ b/paddle/fluid/framework/details/all_reduce_op_handle.cc @@ -17,7 +17,7 @@ #include "paddle/fluid/framework/details/container_cast.h" #include "paddle/fluid/framework/details/reduce_and_gather.h" #include "paddle/fluid/platform/place.h" -#include "paddle/fluid/platform/profiler.h" +#include "paddle/fluid/platform/profiler/event_tracing.h" #if defined(PADDLE_WITH_NCCL) || defined(PADDLE_WITH_RCCL) DECLARE_bool(sync_nccl_allreduce); @@ -68,8 +68,8 @@ AllReduceOpHandle::AllReduceOpHandle(ir::Node *node, #endif void AllReduceOpHandle::RunImpl() { - platform::RecordEvent record_event(Name()); - + platform::RecordEvent record_event( + Name(), platform::TracerEventType::Communication, 1); WaitInputVarGenerated(); std::vector inputs = this->Inputs(); std::vector outputs = this->Outputs(); diff --git a/paddle/fluid/framework/details/bind_threaded_ssa_graph_executor.cc b/paddle/fluid/framework/details/bind_threaded_ssa_graph_executor.cc index 0d8f71a7555ec293dd91beb273a3527ab8ae1d30..75baf15dc5ec953c817c02227e4f34424bc65515 100644 --- a/paddle/fluid/framework/details/bind_threaded_ssa_graph_executor.cc +++ b/paddle/fluid/framework/details/bind_threaded_ssa_graph_executor.cc @@ -23,7 +23,7 @@ #include "paddle/fluid/framework/details/multi_devices_helper.h" #include "paddle/fluid/framework/ir/graph_helper.h" #include "paddle/fluid/platform/device_context.h" -#include "paddle/fluid/platform/profiler.h" +#include "paddle/fluid/platform/profiler/event_tracing.h" #if defined(PADDLE_WITH_XPU) namespace paddle { diff --git a/paddle/fluid/framework/details/broadcast_op_handle.cc b/paddle/fluid/framework/details/broadcast_op_handle.cc index d058949ec6a1949aa3b48cbcc5e66a06ec1e9ce2..ff2e66082e69dc6b854a5a25b3976d50b392c10e 100644 --- a/paddle/fluid/framework/details/broadcast_op_handle.cc +++ b/paddle/fluid/framework/details/broadcast_op_handle.cc @@ -18,15 +18,15 @@ #include "paddle/fluid/framework/details/container_cast.h" #include "paddle/fluid/framework/details/variable_visitor.h" #include "paddle/fluid/platform/place.h" -#include "paddle/fluid/platform/profiler.h" +#include "paddle/fluid/platform/profiler/event_tracing.h" namespace paddle { namespace framework { namespace details { void BroadcastOpHandle::RunImpl() { - platform::RecordEvent record_event(Name()); - + platform::RecordEvent record_event( + Name(), platform::TracerEventType::Communication, 1); if (places_.size() == 1) return; // The input and output may have dummy vars. diff --git a/paddle/fluid/framework/details/eager_deletion_op_handle.cc b/paddle/fluid/framework/details/eager_deletion_op_handle.cc index c760e7a98614cb55dd5c39883601cf85df00d7c1..b8def1f1746471ff151788aa1ef54adef362e60b 100644 --- a/paddle/fluid/framework/details/eager_deletion_op_handle.cc +++ b/paddle/fluid/framework/details/eager_deletion_op_handle.cc @@ -15,7 +15,7 @@ #include "paddle/fluid/framework/details/eager_deletion_op_handle.h" #include "paddle/fluid/framework/ir/memory_optimize_pass/memory_optimization_var_info.h" -#include "paddle/fluid/platform/profiler.h" +#include "paddle/fluid/platform/profiler/event_tracing.h" #if defined(PADDLE_WITH_CUDA) || defined(PADDLE_WITH_HIP) #include "paddle/fluid/platform/cuda_device_guard.h" #endif @@ -128,7 +128,8 @@ void EagerDeletionOpHandle::RunImpl() { CallOnce(); } - platform::RecordEvent record_event(Name()); + platform::RecordEvent record_event(Name(), + platform::TracerEventType::UserDefined, 2); std::deque> garbages; for (size_t i = 0; i < var_infos_.size(); ++i) { auto *var_info = var_infos_[i]; diff --git a/paddle/fluid/framework/details/fast_threaded_ssa_graph_executor.cc b/paddle/fluid/framework/details/fast_threaded_ssa_graph_executor.cc index 75998e4582e2bcf68569929963cedfc24874f547..1cf69a1a3d652a49226447c5559613378bd3ee17 100644 --- a/paddle/fluid/framework/details/fast_threaded_ssa_graph_executor.cc +++ b/paddle/fluid/framework/details/fast_threaded_ssa_graph_executor.cc @@ -24,7 +24,7 @@ #include "paddle/fluid/framework/details/fetch_async_op_handle.h" #include "paddle/fluid/framework/details/multi_devices_helper.h" #include "paddle/fluid/framework/ir/graph_helper.h" -#include "paddle/fluid/platform/profiler.h" +#include "paddle/fluid/platform/profiler/event_tracing.h" namespace paddle { namespace framework { @@ -65,7 +65,8 @@ FetchResultType FastThreadedSSAGraphExecutor::Run( const std::vector &fetch_tensors, bool return_merged) { VLOG(3) << "enter FastThreadedSSAGraphExecutor Run"; std::unique_ptr event( - new platform::RecordEvent("FastThreadedSSAGraphExecutorPrepare")); + new platform::RecordEvent("FastThreadedSSAGraphExecutorPrepare", + platform::TracerEventType::UserDefined, 2)); std::unique_ptr>> op_deps = atomic_op_deps_.get(); PrepareAtomicOpDeps(); diff --git a/paddle/fluid/framework/details/fetch_async_op_handle.cc b/paddle/fluid/framework/details/fetch_async_op_handle.cc index 69c39acc5fe595dddbfc847fbf9240a8110b63a3..0731663de95f3f81239e05d19517e8a52b51d1f4 100644 --- a/paddle/fluid/framework/details/fetch_async_op_handle.cc +++ b/paddle/fluid/framework/details/fetch_async_op_handle.cc @@ -18,6 +18,7 @@ #include "paddle/fluid/framework/convert_utils.h" #include "paddle/fluid/platform/profiler.h" +#include "paddle/fluid/platform/profiler/event_tracing.h" namespace paddle { namespace framework { @@ -190,7 +191,8 @@ void FetchAsyncOpHandle::FetchMergedLodTensor( } void FetchAsyncOpHandle::RunImpl() { - platform::RecordEvent record_event(Name()); + platform::RecordEvent record_event(Name(), + platform::TracerEventType::Operator, 1); WaitInputVarGenerated(true); // get src vars diff --git a/paddle/fluid/framework/details/fetch_op_handle.cc b/paddle/fluid/framework/details/fetch_op_handle.cc index 60e58fafa419836a0983f8542db4775af7954003..a4de29c8387ae5d0c4f5a76980920b606fdd0de4 100644 --- a/paddle/fluid/framework/details/fetch_op_handle.cc +++ b/paddle/fluid/framework/details/fetch_op_handle.cc @@ -16,7 +16,7 @@ #include -#include "paddle/fluid/platform/profiler.h" +#include "paddle/fluid/platform/profiler/event_tracing.h" namespace paddle { namespace framework { @@ -128,7 +128,8 @@ static void TransData(const framework::LoDTensor &src_item, } void FetchOpHandle::RunImpl() { - platform::RecordEvent record_event(Name()); + platform::RecordEvent record_event(Name(), + platform::TracerEventType::Operator, 1); WaitInputVarGenerated(platform::CPUPlace()); tensors_.resize(inputs_.size()); diff --git a/paddle/fluid/framework/details/fused_all_reduce_op_handle.cc b/paddle/fluid/framework/details/fused_all_reduce_op_handle.cc index 8f76de2393eaaf40c3630903dc16ed4499b76376..f4ca4907d48d08a4a357c3e6d12d8c856e12358b 100644 --- a/paddle/fluid/framework/details/fused_all_reduce_op_handle.cc +++ b/paddle/fluid/framework/details/fused_all_reduce_op_handle.cc @@ -18,7 +18,7 @@ #include "paddle/fluid/framework/details/variable_visitor.h" #include "paddle/fluid/platform/device_memory_aligment.h" #include "paddle/fluid/platform/place.h" -#include "paddle/fluid/platform/profiler.h" +#include "paddle/fluid/platform/profiler/event_tracing.h" DEFINE_bool(skip_fused_all_reduce_check, false, ""); DECLARE_bool(allreduce_record_one_event); @@ -68,7 +68,8 @@ FusedAllReduceOpHandle::~FusedAllReduceOpHandle() { } void FusedAllReduceOpHandle::RunImpl() { - platform::RecordEvent record_event(Name()); + platform::RecordEvent record_event( + Name(), platform::TracerEventType::Communication, 1); VLOG(4) << this->DebugString(); #if defined(PADDLE_WITH_NCCL) || defined(PADDLE_WITH_RCCL) diff --git a/paddle/fluid/framework/details/fused_broadcast_op_handle.cc b/paddle/fluid/framework/details/fused_broadcast_op_handle.cc index 51ed1ca01b660555a79babbfe1022d4b18b098c1..2490f3d6102da13ea192c7a7a1ff800ff4623243 100644 --- a/paddle/fluid/framework/details/fused_broadcast_op_handle.cc +++ b/paddle/fluid/framework/details/fused_broadcast_op_handle.cc @@ -15,14 +15,15 @@ #include "paddle/fluid/framework/details/fused_broadcast_op_handle.h" #include "paddle/fluid/framework/details/container_cast.h" -#include "paddle/fluid/platform/profiler.h" +#include "paddle/fluid/platform/profiler/event_tracing.h" namespace paddle { namespace framework { namespace details { void FusedBroadcastOpHandle::RunImpl() { - platform::RecordEvent record_event(Name()); + platform::RecordEvent record_event( + Name(), platform::TracerEventType::Communication, 1); if (places_.size() == 1UL) return; diff --git a/paddle/fluid/framework/details/reduce_op_handle.cc b/paddle/fluid/framework/details/reduce_op_handle.cc index 4df42a7d93d19e7852c4b9b74565c5dcd68ea941..b5b052f1a1f56d7732b4155ee63f496dc0d7ae31 100644 --- a/paddle/fluid/framework/details/reduce_op_handle.cc +++ b/paddle/fluid/framework/details/reduce_op_handle.cc @@ -19,7 +19,7 @@ #include "paddle/fluid/framework/details/reduce_and_gather.h" #include "paddle/fluid/framework/details/variable_visitor.h" #include "paddle/fluid/platform/place.h" -#include "paddle/fluid/platform/profiler.h" +#include "paddle/fluid/platform/profiler/event_tracing.h" PADDLE_DEFINE_EXPORTED_bool( cpu_deterministic, false, @@ -46,7 +46,8 @@ void ReduceOpHandle::Wait( } void ReduceOpHandle::RunImpl() { - platform::RecordEvent record_event(Name()); + platform::RecordEvent record_event( + Name(), platform::TracerEventType::Communication, 1); if (places_.size() == 1) return; // the input and output may have dummy var. diff --git a/paddle/fluid/framework/details/rpc_op_handle.cc b/paddle/fluid/framework/details/rpc_op_handle.cc index 8d61a103f98be81309d890f25b8ab6f41d5c3f02..39bcf1d0f385f93cdd867e47c8dc8ba40dc263b9 100644 --- a/paddle/fluid/framework/details/rpc_op_handle.cc +++ b/paddle/fluid/framework/details/rpc_op_handle.cc @@ -14,7 +14,7 @@ #include "paddle/fluid/framework/details/rpc_op_handle.h" #include "paddle/fluid/framework/ir/graph.h" -#include "paddle/fluid/platform/profiler.h" +#include "paddle/fluid/platform/profiler/event_tracing.h" namespace paddle { namespace framework { @@ -30,7 +30,8 @@ RPCOpHandle::RPCOpHandle(ir::Node *node, const framework::OpDesc &op_desc, place_(place) {} void RPCOpHandle::RunImpl() { - platform::RecordEvent record_event(Name()); + platform::RecordEvent record_event( + Name(), platform::TracerEventType::Communication, 1); for (auto *in : inputs_) { auto &p = static_cast(in)->place(); diff --git a/paddle/fluid/framework/details/scale_loss_grad_op_handle.cc b/paddle/fluid/framework/details/scale_loss_grad_op_handle.cc index 3d877dbbde248c96d392099fe3cdf7948ea53adf..23e96875daa3d546587719e2a33cfe5dfbdd33eb 100644 --- a/paddle/fluid/framework/details/scale_loss_grad_op_handle.cc +++ b/paddle/fluid/framework/details/scale_loss_grad_op_handle.cc @@ -16,7 +16,7 @@ #include -#include "paddle/fluid/platform/profiler.h" +#include "paddle/fluid/platform/profiler/event_tracing.h" namespace pten { class DenseTensor; @@ -88,7 +88,8 @@ std::string ScaleLossGradOpHandle::LossGradName() const { } void ScaleLossGradOpHandle::RunImpl() { - platform::RecordEvent record_event(Name()); + platform::RecordEvent record_event(Name(), + platform::TracerEventType::UserDefined, 2); RunOnVar(local_exec_scopes_[0]->FindVar(LossGradName()), true); } diff --git a/paddle/fluid/pybind/tensor_py.h b/paddle/fluid/pybind/tensor_py.h index f1983175bdf94fa6e9fcee49e6f85e7bdf6f4765..051f58da3931af7cd0a33f1cbadccf29d32b2e8c 100644 --- a/paddle/fluid/pybind/tensor_py.h +++ b/paddle/fluid/pybind/tensor_py.h @@ -35,7 +35,7 @@ limitations under the License. */ #include "paddle/fluid/framework/convert_utils.h" #include "paddle/fluid/platform/device_context.h" #include "paddle/fluid/platform/float16.h" -#include "paddle/fluid/platform/profiler.h" +#include "paddle/fluid/platform/profiler/event_tracing.h" #include "pybind11/numpy.h" #include "pybind11/pybind11.h"