未验证 提交 a97b3630 编写于 作者: J jakpiase 提交者: GitHub

Fix reorder events missing from profiling output (#47777)

上级 fb16fea3
...@@ -60,10 +60,6 @@ inline void AddSubNonBroadcast(platform::ReorderMKLDNNHandler* reorder_handler, ...@@ -60,10 +60,6 @@ inline void AddSubNonBroadcast(platform::ReorderMKLDNNHandler* reorder_handler,
reorder_attr.set_output_scales(0, scales); reorder_attr.set_output_scales(0, scales);
auto reorder_p = auto reorder_p =
reorder_handler->AcquireReorder(dst_memory, src_memory, reorder_attr); reorder_handler->AcquireReorder(dst_memory, src_memory, reorder_attr);
platform::RecordEvent record_reorder("int_reorder",
platform::TracerEventType::UserDefined,
2,
platform::EventRole::kUniqueOp);
reorder_p->execute(platform::MKLDNNDeviceContext::tls().get_stream(), reorder_p->execute(platform::MKLDNNDeviceContext::tls().get_stream(),
*src_memory, *src_memory,
......
...@@ -292,7 +292,7 @@ class ConvTransposeMKLDNNHandlerT ...@@ -292,7 +292,7 @@ class ConvTransposeMKLDNNHandlerT
platform::RecordEvent record_reorder( platform::RecordEvent record_reorder(
"int_reorder", "int_reorder",
platform::TracerEventType::UserDefined, platform::TracerEventType::UserDefined,
2, 1,
platform::EventRole::kUniqueOp); platform::EventRole::kUniqueOp);
reorder_p->execute( reorder_p->execute(
astream, astream,
...@@ -318,7 +318,7 @@ class ConvTransposeMKLDNNHandlerT ...@@ -318,7 +318,7 @@ class ConvTransposeMKLDNNHandlerT
platform::RecordEvent record_reorder( platform::RecordEvent record_reorder(
"int_reorder", "int_reorder",
platform::TracerEventType::UserDefined, platform::TracerEventType::UserDefined,
2, 1,
platform::EventRole::kUniqueOp); platform::EventRole::kUniqueOp);
reorder_p->execute( reorder_p->execute(
astream, astream,
......
...@@ -210,10 +210,17 @@ class FCMKLDNNHandler ...@@ -210,10 +210,17 @@ class FCMKLDNNHandler
*user_memory_p, *target_memory_p, attrs); *user_memory_p, *target_memory_p, attrs);
auto& astream = platform::MKLDNNDeviceContext::tls().get_stream(); auto& astream = platform::MKLDNNDeviceContext::tls().get_stream();
reorder_p->execute( {
astream, platform::RecordEvent record_reorder(
{{DNNL_ARG_FROM, *user_memory_p}, {DNNL_ARG_TO, *target_memory_p}}); "int_reorder",
astream.wait(); platform::TracerEventType::UserDefined,
1,
platform::EventRole::kUniqueOp);
reorder_p->execute(
astream,
{{DNNL_ARG_FROM, *user_memory_p}, {DNNL_ARG_TO, *target_memory_p}});
astream.wait();
}
return target_memory_p; return target_memory_p;
} }
......
...@@ -380,7 +380,7 @@ class OneDNNHandlerT { ...@@ -380,7 +380,7 @@ class OneDNNHandlerT {
paddle::platform::RecordEvent record_reorder( paddle::platform::RecordEvent record_reorder(
"int_reorder", "int_reorder",
paddle::platform::TracerEventType::UserDefined, paddle::platform::TracerEventType::UserDefined,
2, 1,
paddle::platform::EventRole::kUniqueOp); paddle::platform::EventRole::kUniqueOp);
reorder_p->execute( reorder_p->execute(
astream, astream,
...@@ -433,7 +433,7 @@ class OneDNNHandlerT { ...@@ -433,7 +433,7 @@ class OneDNNHandlerT {
paddle::platform::RecordEvent record_reorder( paddle::platform::RecordEvent record_reorder(
"int_reorder", "int_reorder",
paddle::platform::TracerEventType::UserDefined, paddle::platform::TracerEventType::UserDefined,
2, 1,
paddle::platform::EventRole::kUniqueOp); paddle::platform::EventRole::kUniqueOp);
reorder_p->execute( reorder_p->execute(
astream, astream,
...@@ -459,7 +459,7 @@ class OneDNNHandlerT { ...@@ -459,7 +459,7 @@ class OneDNNHandlerT {
paddle::platform::RecordEvent record_reorder( paddle::platform::RecordEvent record_reorder(
"int_reorder", "int_reorder",
paddle::platform::TracerEventType::UserDefined, paddle::platform::TracerEventType::UserDefined,
2, 1,
paddle::platform::EventRole::kUniqueOp); paddle::platform::EventRole::kUniqueOp);
reorder_p->execute( reorder_p->execute(
astream, astream,
...@@ -647,7 +647,7 @@ class OneDNNHandlerNoCachingT { ...@@ -647,7 +647,7 @@ class OneDNNHandlerNoCachingT {
paddle::platform::RecordEvent record_reorder( paddle::platform::RecordEvent record_reorder(
"int_reorder", "int_reorder",
paddle::platform::TracerEventType::UserDefined, paddle::platform::TracerEventType::UserDefined,
2, 1,
paddle::platform::EventRole::kUniqueOp); paddle::platform::EventRole::kUniqueOp);
reorder_p->execute( reorder_p->execute(
astream, astream,
...@@ -678,7 +678,7 @@ class OneDNNHandlerNoCachingT { ...@@ -678,7 +678,7 @@ class OneDNNHandlerNoCachingT {
paddle::platform::RecordEvent record_reorder( paddle::platform::RecordEvent record_reorder(
"int_reorder", "int_reorder",
paddle::platform::TracerEventType::UserDefined, paddle::platform::TracerEventType::UserDefined,
2, 1,
paddle::platform::EventRole::kUniqueOp); paddle::platform::EventRole::kUniqueOp);
reorder_p->execute( reorder_p->execute(
astream, astream,
......
...@@ -143,7 +143,7 @@ void ConvGradKernel(const Context& dev_ctx, ...@@ -143,7 +143,7 @@ void ConvGradKernel(const Context& dev_ctx,
paddle::platform::RecordEvent record_reorder( paddle::platform::RecordEvent record_reorder(
"int_reorder", "int_reorder",
paddle::platform::TracerEventType::UserDefined, paddle::platform::TracerEventType::UserDefined,
2, 1,
paddle::platform::EventRole::kUniqueOp); paddle::platform::EventRole::kUniqueOp);
reorder_p->execute( reorder_p->execute(
astream, *diff_weights_memory_p, *reorder_dst_memory_p); astream, *diff_weights_memory_p, *reorder_dst_memory_p);
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册