未验证 提交 a97b3630 编写于 作者: J jakpiase 提交者: GitHub

fix for missing reorders in profiling (#47777)

上级 fb16fea3
......@@ -60,10 +60,6 @@ inline void AddSubNonBroadcast(platform::ReorderMKLDNNHandler* reorder_handler,
reorder_attr.set_output_scales(0, scales);
auto reorder_p =
reorder_handler->AcquireReorder(dst_memory, src_memory, reorder_attr);
- platform::RecordEvent record_reorder("int_reorder",
- platform::TracerEventType::UserDefined,
- 2,
- platform::EventRole::kUniqueOp);
reorder_p->execute(platform::MKLDNNDeviceContext::tls().get_stream(),
*src_memory,
......
......@@ -292,7 +292,7 @@ class ConvTransposeMKLDNNHandlerT
platform::RecordEvent record_reorder(
"int_reorder",
platform::TracerEventType::UserDefined,
- 2,
+ 1,
platform::EventRole::kUniqueOp);
reorder_p->execute(
astream,
......@@ -318,7 +318,7 @@ class ConvTransposeMKLDNNHandlerT
platform::RecordEvent record_reorder(
"int_reorder",
platform::TracerEventType::UserDefined,
- 2,
+ 1,
platform::EventRole::kUniqueOp);
reorder_p->execute(
astream,
......
......@@ -210,10 +210,17 @@ class FCMKLDNNHandler
*user_memory_p, *target_memory_p, attrs);
auto& astream = platform::MKLDNNDeviceContext::tls().get_stream();
+ {
+ platform::RecordEvent record_reorder(
+ "int_reorder",
+ platform::TracerEventType::UserDefined,
+ 1,
+ platform::EventRole::kUniqueOp);
reorder_p->execute(
astream,
{{DNNL_ARG_FROM, *user_memory_p}, {DNNL_ARG_TO, *target_memory_p}});
astream.wait();
+ }
return target_memory_p;
}
......
......@@ -380,7 +380,7 @@ class OneDNNHandlerT {
paddle::platform::RecordEvent record_reorder(
"int_reorder",
paddle::platform::TracerEventType::UserDefined,
- 2,
+ 1,
paddle::platform::EventRole::kUniqueOp);
reorder_p->execute(
astream,
......@@ -433,7 +433,7 @@ class OneDNNHandlerT {
paddle::platform::RecordEvent record_reorder(
"int_reorder",
paddle::platform::TracerEventType::UserDefined,
- 2,
+ 1,
paddle::platform::EventRole::kUniqueOp);
reorder_p->execute(
astream,
......@@ -459,7 +459,7 @@ class OneDNNHandlerT {
paddle::platform::RecordEvent record_reorder(
"int_reorder",
paddle::platform::TracerEventType::UserDefined,
- 2,
+ 1,
paddle::platform::EventRole::kUniqueOp);
reorder_p->execute(
astream,
......@@ -647,7 +647,7 @@ class OneDNNHandlerNoCachingT {
paddle::platform::RecordEvent record_reorder(
"int_reorder",
paddle::platform::TracerEventType::UserDefined,
- 2,
+ 1,
paddle::platform::EventRole::kUniqueOp);
reorder_p->execute(
astream,
......@@ -678,7 +678,7 @@ class OneDNNHandlerNoCachingT {
paddle::platform::RecordEvent record_reorder(
"int_reorder",
paddle::platform::TracerEventType::UserDefined,
- 2,
+ 1,
paddle::platform::EventRole::kUniqueOp);
reorder_p->execute(
astream,
......
......@@ -143,7 +143,7 @@ void ConvGradKernel(const Context& dev_ctx,
paddle::platform::RecordEvent record_reorder(
"int_reorder",
paddle::platform::TracerEventType::UserDefined,
- 2,
+ 1,
paddle::platform::EventRole::kUniqueOp);
reorder_p->execute(
astream, *diff_weights_memory_p, *reorder_dst_memory_p);
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册