Skip to content
体验新版
项目
组织
正在加载...
登录
切换导航
打开侧边栏
MegEngine 天元
MegEngine
提交
2886245b
MegEngine
项目概览
MegEngine 天元
/
MegEngine
1 年多 前同步成功
通知
404
Star
4705
Fork
582
代码
文件
提交
分支
Tags
贡献者
分支图
Diff
Issue
0
列表
看板
标记
里程碑
合并请求
0
DevOps
流水线
流水线任务
计划
Wiki
0
Wiki
分析
仓库
DevOps
项目成员
Pages
MegEngine
项目概览
项目概览
详情
发布
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
Issue
0
Issue
0
列表
看板
标记
里程碑
合并请求
0
合并请求
0
Pages
DevOps
DevOps
流水线
流水线任务
计划
分析
分析
仓库分析
DevOps
Wiki
0
Wiki
成员
成员
收起侧边栏
关闭侧边栏
动态
分支图
创建新Issue
流水线任务
提交
Issue看板
提交
2886245b
编写于
5月 26, 2022
作者:
M
Megvii Engine Team
浏览文件
操作
浏览文件
下载
电子邮件补丁
差异文件
perf(imperative/src): improve pad host performance
GitOrigin-RevId: 05223deca753dd862e40f6f8a26c1fca56d8e216
上级
b55942a9
变更
4
隐藏空白更改
内联
并排
Showing
4 changed file
with
100 addition
and
19 deletion
+100
-19
dnn/include/megdnn/oprs/general.h
dnn/include/megdnn/oprs/general.h
+4
-0
dnn/src/common/padding.cpp
dnn/src/common/padding.cpp
+19
-10
imperative/src/impl/ops/padding.cpp
imperative/src/impl/ops/padding.cpp
+77
-0
imperative/src/impl/ops/specializations.cpp
imperative/src/impl/ops/specializations.cpp
+0
-9
未找到文件。
dnn/include/megdnn/oprs/general.h
浏览文件 @
2886245b
...
@@ -1406,6 +1406,7 @@ public:
...
@@ -1406,6 +1406,7 @@ public:
protected:
protected:
SmallVector
<
size_t
>
get_offsets
();
SmallVector
<
size_t
>
get_offsets
();
MGE_WIN_DECLSPEC_FUC
static
SmallVector
<
size_t
>
get_offsets_impl
(
const
Param
&
p
);
void
check_exec
(
const
TensorLayout
&
src
,
const
TensorLayout
&
dst
);
void
check_exec
(
const
TensorLayout
&
src
,
const
TensorLayout
&
dst
);
};
};
...
@@ -1421,6 +1422,9 @@ public:
...
@@ -1421,6 +1422,9 @@ public:
const
TensorLayout
&
src
,
const
TensorLayout
&
dst
)
=
0
;
const
TensorLayout
&
src
,
const
TensorLayout
&
dst
)
=
0
;
void
deduce_layout
(
const
TensorLayout
&
src
,
TensorLayout
&
dst
);
void
deduce_layout
(
const
TensorLayout
&
src
,
TensorLayout
&
dst
);
MGE_WIN_DECLSPEC_FUC
static
void
deduce_layout_impl
(
const
TensorLayout
&
src
,
TensorLayout
&
dst
,
const
Param
&
p
);
protected:
protected:
void
forward_check_exec
(
const
TensorLayout
&
src
,
const
TensorLayout
&
dst
);
void
forward_check_exec
(
const
TensorLayout
&
src
,
const
TensorLayout
&
dst
);
};
};
...
...
dnn/src/common/padding.cpp
浏览文件 @
2886245b
...
@@ -7,6 +7,7 @@
...
@@ -7,6 +7,7 @@
namespace
megdnn
{
namespace
megdnn
{
using
padding_param
=
megdnn
::
param_enumv
::
Padding
;
using
padding_param
=
megdnn
::
param_enumv
::
Padding
;
using
Param
=
PaddingBase
::
Param
;
void
PaddingForward
::
forward_check_exec
(
void
PaddingForward
::
forward_check_exec
(
const
TensorLayout
&
src
,
const
TensorLayout
&
dst
)
{
const
TensorLayout
&
src
,
const
TensorLayout
&
dst
)
{
...
@@ -19,8 +20,9 @@ void PaddingForward::forward_check_exec(
...
@@ -19,8 +20,9 @@ void PaddingForward::forward_check_exec(
"unsupported %s dtype for forward padding opr"
,
src
.
dtype
.
name
());
"unsupported %s dtype for forward padding opr"
,
src
.
dtype
.
name
());
}
}
void
PaddingForward
::
deduce_layout
(
const
TensorLayout
&
src
,
TensorLayout
&
dst
)
{
void
PaddingForward
::
deduce_layout_impl
(
SmallVector
<
size_t
>
offsets
(
get_offsets
());
const
TensorLayout
&
src
,
TensorLayout
&
dst
,
const
Param
&
p
)
{
SmallVector
<
size_t
>
offsets
(
get_offsets_impl
(
p
));
TensorShape
dst_shape
;
TensorShape
dst_shape
;
switch
(
src
.
ndim
)
{
switch
(
src
.
ndim
)
{
case
1
:
case
1
:
...
@@ -76,6 +78,10 @@ void PaddingForward::deduce_layout(const TensorLayout& src, TensorLayout& dst) {
...
@@ -76,6 +78,10 @@ void PaddingForward::deduce_layout(const TensorLayout& src, TensorLayout& dst) {
dst
=
TensorLayout
(
dst_shape
,
src
.
dtype
);
dst
=
TensorLayout
(
dst_shape
,
src
.
dtype
);
}
}
/*!
 * \brief Deduce the destination layout for this operator instance.
 *
 * Thin instance-level entry point: forwards to the static
 * deduce_layout_impl() with the operator's own param().
 *
 * \param src layout of the tensor to be padded
 * \param dst [out] receives the deduced layout
 */
void PaddingForward::deduce_layout(const TensorLayout& src, TensorLayout& dst) {
    deduce_layout_impl(src, dst, param());
}
void
PaddingBackward
::
backward_check_exec
(
void
PaddingBackward
::
backward_check_exec
(
const
TensorLayout
&
src
,
const
TensorLayout
&
dst
)
{
const
TensorLayout
&
src
,
const
TensorLayout
&
dst
)
{
check_exec
(
dst
,
src
);
check_exec
(
dst
,
src
);
...
@@ -86,17 +92,20 @@ void PaddingBackward::backward_check_exec(
...
@@ -86,17 +92,20 @@ void PaddingBackward::backward_check_exec(
"unsupported %s dtype for forward padding opr"
,
src
.
dtype
.
name
());
"unsupported %s dtype for forward padding opr"
,
src
.
dtype
.
name
());
}
}
SmallVector
<
size_t
>
PaddingBase
::
get_offsets
()
{
SmallVector
<
size_t
>
PaddingBase
::
get_offsets_impl
(
const
Param
&
p
)
{
SmallVector
<
size_t
>
offsets
=
{
param
().
front_offset_dim0
,
param
().
back_offset_dim0
,
SmallVector
<
size_t
>
offsets
=
{
param
().
front_offset_dim1
,
param
().
back_offset_dim1
,
p
.
front_offset_dim0
,
p
.
back_offset_dim0
,
p
.
front_offset_dim1
,
param
().
front_offset_dim2
,
param
().
back_offset_dim2
,
p
.
back_offset_dim1
,
p
.
front_offset_dim2
,
p
.
back_offset_dim2
,
param
().
front_offset_dim3
,
param
().
back_offset_dim3
,
p
.
front_offset_dim3
,
p
.
back_offset_dim3
,
p
.
front_offset_dim4
,
param
().
front_offset_dim4
,
param
().
back_offset_dim4
,
p
.
back_offset_dim4
,
p
.
front_offset_dim5
,
p
.
back_offset_dim5
,
param
().
front_offset_dim5
,
param
().
back_offset_dim5
,
p
.
front_offset_dim6
,
p
.
back_offset_dim6
};
param
().
front_offset_dim6
,
param
().
back_offset_dim6
};
return
offsets
;
return
offsets
;
}
}
/*!
 * \brief Collect the padding offsets of this operator instance.
 *
 * Delegates to the static get_offsets_impl() with the operator's own
 * param(); the ordering of the returned values is whatever
 * get_offsets_impl() produces.
 */
SmallVector<size_t> PaddingBase::get_offsets() {
    const auto& own_param = param();
    return get_offsets_impl(own_param);
}
void
PaddingBase
::
check_exec
(
const
TensorLayout
&
src
,
const
TensorLayout
&
dst
)
{
void
PaddingBase
::
check_exec
(
const
TensorLayout
&
src
,
const
TensorLayout
&
dst
)
{
SmallVector
<
size_t
>
offsets
(
get_offsets
());
SmallVector
<
size_t
>
offsets
(
get_offsets
());
// make sure the src and dst tensor not empty
// make sure the src and dst tensor not empty
...
...
imperative/src/impl/ops/padding.cpp
0 → 100644
浏览文件 @
2886245b
#include "megbrain/graph/symbol_var.h"
#include "megbrain/imperative/ops/autogen.h"
#include "megbrain/imperative/physical_tensor.h"
#include "megbrain/imperative/proxy_graph_detail.h"
#include "megbrain/opr/basic_arith.h"
#include "megbrain/opr/internal/megdnn_opr_wrapper.h"
#include "megbrain/opr/io.h"
#include "megbrain/opr/tensor_manip.h"
#include "megdnn/dtype.h"
#include "../blob_manager_impl.h"
#include "../dnn_op_helper.h"
#include "../op_trait.h"
namespace
mgb
{
namespace
imperative
{
namespace
{
namespace
padding
{
/*!
 * \brief Graph-mode application of the Padding op.
 *
 * Builds an opr::Padding node from the single input var, using the param
 * carried by the op definition.
 *
 * \param def    op definition; statically cast to Padding
 * \param inputs input vars; exactly one is required (asserted)
 */
auto apply_on_var_node(const OpDef& def, const VarNodeArray& inputs) {
    const auto& padding_def = static_cast<const Padding&>(def);
    mgb_assert(inputs.size() == 1);
    return opr::Padding::make(inputs[0], padding_def.param());
}
/*!
 * \brief Eager execution of Padding on a physical tensor.
 *
 * Creates a megdnn::Padding caller on the input's comp node, copies the op
 * param into it, allocates the output through BlobManager and runs the
 * kernel.
 *
 * \param def          op definition; must be a Padding
 * \param inputs       input tensors; only inputs[0] is read
 * \param output_descs output descriptors; output_descs[0].layout is the
 *                     starting value of the output layout
 * \param validated    when false, the output layout is re-deduced from the
 *                     input layout instead of trusting output_descs
 * \return a single-element vector holding the padded tensor
 */
SmallVector<TensorPtr> apply_on_physical_tensor(
        const OpDef& def, const SmallVector<TensorPtr>& inputs,
        SmallVector<LogicalTensorDesc>& output_descs, const bool& validated) {
    const TensorPtr& src = inputs[0];
    auto comp_node = src->comp_node();
    auto&& padding_def = def.cast_final_safe<Padding>();

    DnnOprCaller<megdnn::Padding> caller(comp_node);
    caller.op->param() = padding_def.param();

    TensorLayout out_layout = output_descs[0].layout;
    if (!validated) {
        // The descriptor was not validated upstream, so recompute the layout
        // from the actual input tensor.
        megdnn::Padding::deduce_layout_impl(
                src->dnn_tensor().layout, out_layout, padding_def.param());
    }

    DeviceTensorND result =
            BlobManager::inst()->alloc_workspace_with_defrag(comp_node, out_layout);
    caller.op->exec(src->dnn_tensor(), result.as_megdnn());
    return {Tensor::make(result)};
}
/*!
 * \brief Infer the output descriptor of Padding from the input descriptor.
 *
 * \param def    op definition; must be a Padding
 * \param inputs input descriptors; exactly one is required (asserted, in
 *               line with apply_on_var_node)
 * \return the output descriptor list plus a flag telling whether the
 *         inference succeeded. When the input layout has ndim == 0 only the
 *         dtype and comp node are propagated and the flag is false;
 *         otherwise the layout comes from
 *         megdnn::Padding::deduce_layout_impl() and the flag is true.
 */
std::tuple<SmallVector<LogicalTensorDesc>, bool> infer_output_attrs_fallible(
        const OpDef& def, const SmallVector<LogicalTensorDesc>& inputs) {
    // Replaces the previously unused `nr_inp` local: inputs[0] is read
    // below, so make the single-input precondition explicit.
    mgb_assert(inputs.size() == 1);

    auto&& op_def = def.cast_final_safe<Padding>();
    const auto p = op_def.param();

    auto&& inp = inputs[0];
    auto& inp_cn = inp.comp_node;

    if (inp.layout.ndim == 0) {
        // Input shape not available yet: report dtype/comp node only.
        return {{{TensorLayout{inp.layout.dtype}, inp_cn, {}}}, false};
    }

    TensorLayout oup_layout;
    megdnn::Padding::deduce_layout_impl(inp.layout, oup_layout, p);
    return {{{oup_layout, inp_cn, {}}}, true};
}
// Register the op trait for Padding (associated with opr::Padding), wiring
// in the three handlers defined in this namespace: apply_on_var_node,
// apply_on_physical_tensor and infer_output_attrs_fallible.
// NOTE(review): .fallback() presumably fills the remaining trait hooks with
// defaults -- confirm against op_trait.h.
OP_TRAIT_REG
(
Padding
,
Padding
,
opr
::
Padding
)
.
apply_on_var_node
(
apply_on_var_node
)
.
apply_on_physical_tensor
(
apply_on_physical_tensor
)
.
infer_output_attrs_fallible
(
infer_output_attrs_fallible
)
.
fallback
();
}
// namespace padding
}
// namespace
}
// namespace imperative
}
// namespace mgb
// vim: syntax=cpp.doxygen foldmethod=marker foldmarker=f{{{,f}}}
\ No newline at end of file
imperative/src/impl/ops/specializations.cpp
浏览文件 @
2886245b
...
@@ -664,15 +664,6 @@ OP_TRAIT_REG(Cumsum, Cumsum).apply_on_var_node(apply_on_var_node).fallback();
...
@@ -664,15 +664,6 @@ OP_TRAIT_REG(Cumsum, Cumsum).apply_on_var_node(apply_on_var_node).fallback();
}
// namespace cumsum
}
// namespace cumsum
}
// namespace
}
// namespace
namespace
padding
{
auto
apply_on_var_node
(
const
OpDef
&
def
,
const
VarNodeArray
&
inputs
)
{
auto
&&
op
=
static_cast
<
const
Padding
&>
(
def
);
mgb_assert
(
inputs
.
size
()
==
1
);
return
opr
::
Padding
::
make
(
inputs
[
0
],
op
.
param
());
}
OP_TRAIT_REG
(
Padding
,
Padding
).
apply_on_var_node
(
apply_on_var_node
).
fallback
();
}
// namespace padding
namespace
lrn
{
namespace
lrn
{
auto
apply_on_var_node
(
const
OpDef
&
def
,
const
VarNodeArray
&
inputs
)
{
auto
apply_on_var_node
(
const
OpDef
&
def
,
const
VarNodeArray
&
inputs
)
{
auto
&&
op
=
static_cast
<
const
LRN
&>
(
def
);
auto
&&
op
=
static_cast
<
const
LRN
&>
(
def
);
...
...
编辑
预览
Markdown
is supported
0%
请重试
或
添加新附件
.
添加附件
取消
You are about to add
0
people
to the discussion. Proceed with caution.
先完成此消息的编辑!
取消
想要评论请
注册
或
登录