Skip to content
体验新版
项目
组织
正在加载...
登录
切换导航
打开侧边栏
magicwindyyd
mindspore
提交
82ae946f
M
mindspore
项目概览
magicwindyyd
/
mindspore
与 Fork 源项目一致
Fork自
MindSpore / mindspore
通知
1
Star
1
Fork
0
代码
文件
提交
分支
Tags
贡献者
分支图
Diff
Issue
0
列表
看板
标记
里程碑
合并请求
0
Wiki
0
Wiki
分析
仓库
DevOps
项目成员
Pages
M
mindspore
项目概览
项目概览
详情
发布
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
Issue
0
Issue
0
列表
看板
标记
里程碑
合并请求
0
合并请求
0
Pages
分析
分析
仓库分析
DevOps
Wiki
0
Wiki
成员
成员
收起侧边栏
关闭侧边栏
动态
分支图
创建新Issue
提交
Issue看板
提交
82ae946f
编写于
4年前
作者:
M
mindspore-ci-bot
提交者:
Gitee
4年前
浏览文件
操作
浏览文件
下载
差异文件
!5362 gpu GoogleNet performance optimize
Merge pull request !5362 from VectorSL/slice
上级
23e9ebfa
f95fe92a
变更
2
隐藏空白更改
内联
并排
Showing
2 changed files
with
18 additions
and
39 deletions
+18
-39
mindspore/ccsrc/backend/kernel_compiler/gpu/arrays/slice_gpu_kernel.h
...src/backend/kernel_compiler/gpu/arrays/slice_gpu_kernel.h
+17
-39
mindspore/ccsrc/runtime/device/gpu/kernel_info_setter.h
mindspore/ccsrc/runtime/device/gpu/kernel_info_setter.h
+1
-0
未找到文件。
mindspore/ccsrc/backend/kernel_compiler/gpu/arrays/slice_gpu_kernel.h
浏览文件 @
82ae946f
...
...
@@ -18,6 +18,7 @@
#define MINDSPORE_CCSRC_BACKEND_KERNEL_COMPILER_GPU_SLICE_GPU_KERNEL_H
#include <vector>
#include <utility>
#include "backend/kernel_compiler/gpu/gpu_kernel.h"
#include "backend/kernel_compiler/gpu/gpu_kernel_factory.h"
#include "backend/kernel_compiler/gpu/cuda_impl/slice_impl.cuh"
...
...
@@ -27,8 +28,7 @@ namespace kernel {
template
<
typename
T
>
class
SliceGpuFwdKernel
:
public
GpuKernel
{
public:
SliceGpuFwdKernel
()
:
is_strided_slice_
(
false
),
is_null_input_
(
false
),
input_size_
(
0
),
output_size_
(
0
),
workspace_size_
(
0
)
{}
SliceGpuFwdKernel
()
:
is_null_input_
(
false
),
input_size_
(
0
),
output_size_
(
0
),
workspace_size_
(
0
)
{}
~
SliceGpuFwdKernel
()
override
=
default
;
const
std
::
vector
<
size_t
>
&
GetInputSizeList
()
const
override
{
return
input_size_list_
;
}
const
std
::
vector
<
size_t
>
&
GetOutputSizeList
()
const
override
{
return
output_size_list_
;
}
...
...
@@ -50,51 +50,31 @@ class SliceGpuFwdKernel : public GpuKernel {
if
(
!
CheckParam
(
kernel_node
))
{
return
false
;
}
auto
input_shape
=
AnfAlgo
::
GetPrevNodeOutputInferShape
(
kernel_node
,
0
);
auto
data_format
=
AnfAlgo
::
GetInputFormat
(
kernel_node
,
0
);
auto
input_shape
=
AnfAlgo
::
GetInputDeviceShape
(
kernel_node
,
0
);
ShapeNdTo4d
(
input_shape
,
&
input_shape_
);
auto
strides
=
AnfAlgo
::
GetCNodePrimitive
(
kernel_node
)
->
GetAttr
(
"strides"
);
if
(
strides
)
{
strides_
=
GetAttr
<
std
::
vector
<
int
>>
(
kernel_node
,
"strides"
);
for
(
auto
i
=
strides_
.
size
();
i
<
4
;
i
++
)
{
(
void
)
strides_
.
insert
(
strides_
.
begin
(),
1
);
}
size_
=
GetAttr
<
std
::
vector
<
int
>>
(
kernel_node
,
"end"
);
is_strided_slice_
=
true
;
}
else
{
size_
=
GetAttr
<
std
::
vector
<
int
>>
(
kernel_node
,
"size"
);
}
for
(
auto
i
=
begin_
.
size
();
i
<
4
;
i
++
)
{
(
void
)
begin_
.
insert
(
begin_
.
begin
(),
0
);
}
for
(
size_t
i
=
size_
.
size
();
i
<
4
;
i
++
)
{
(
void
)
size_
.
insert
(
size_
.
begin
(),
1
);
}
for
(
size_t
i
=
0
;
i
<
begin_
.
size
();
i
++
)
{
if
(
begin_
[
i
]
<
0
)
{
begin_
[
i
]
=
begin_
[
i
]
+
input_shape_
[
i
];
}
}
for
(
size_t
i
=
0
;
i
<
size_
.
size
();
i
++
)
{
if
(
size_
[
i
]
<
0
)
{
size_
[
i
]
=
(
size_
[
i
]
+
input_shape_
[
i
])
>
0
?
(
size_
[
i
]
+
input_shape_
[
i
])
:
0
;
}
if
(
begin_
[
i
]
==
size_
[
i
]
&&
is_strided_slice_
)
{
MS_LOG
(
WARNING
)
<<
"Output is null."
;
is_null_input_
=
true
;
}
if
(
size_
[
i
]
==
0
&&
strides_
[
i
]
>
0
)
{
size_
[
i
]
=
begin_
[
i
]
+
1
;
}
}
input_size_
=
IntToSize
(
input_shape_
[
0
]
*
input_shape_
[
1
]
*
input_shape_
[
2
]
*
input_shape_
[
3
])
*
sizeof
(
T
);
auto
out_shape
=
AnfAlgo
::
GetOutput
Infer
Shape
(
kernel_node
,
0
);
auto
out_shape
=
AnfAlgo
::
GetOutput
Device
Shape
(
kernel_node
,
0
);
output_size_
=
sizeof
(
T
);
for
(
size_t
x
:
out_shape
)
{
output_size_
=
output_size_
*
x
;
}
// transpose begin and size for NHWC data
if
(
data_format
==
"NHWC"
)
{
std
::
swap
(
begin_
[
1
],
begin_
[
3
]);
std
::
swap
(
begin_
[
1
],
begin_
[
2
]);
std
::
swap
(
size_
[
1
],
size_
[
3
]);
std
::
swap
(
size_
[
1
],
size_
[
2
]);
}
InitSizeLists
();
return
true
;
}
...
...
@@ -126,26 +106,24 @@ class SliceGpuFwdKernel : public GpuKernel {
MS_LOG
(
ERROR
)
<<
"Input dims is "
<<
input_shape
.
size
()
<<
", scalar is not supported."
;
return
false
;
}
size_
=
GetAttr
<
std
::
vector
<
int
>>
(
kernel_node
,
"size"
);
begin_
=
GetAttr
<
std
::
vector
<
int
>>
(
kernel_node
,
"begin"
);
for
(
size_t
i
=
0
;
i
<
input_shape
.
size
();
i
++
)
{
if
((
begin_
[
i
]
>
0
&&
(
begin_
[
i
]
>
SizeToInt
(
input_shape
[
i
])))
||
(
begin_
[
i
]
<
0
&&
(
std
::
abs
(
begin_
[
i
])
>
SizeToInt
(
input_shape
[
i
]))))
{
MS_LOG
(
INFO
)
<<
"Input out of bounds "
<<
input_shape
[
i
]
<<
" in axis "
<<
i
<<
"."
;
begin_
[
i
]
=
0
;
if
(
input_shape
[
i
]
<=
0
||
size_
[
i
]
<=
0
)
{
MS_LOG
(
WARNING
)
<<
"Slice output is null."
;
is_null_input_
=
true
;
}
}
return
true
;
}
std
::
vector
<
int
>
begin_
;
std
::
vector
<
int
>
size_
;
std
::
vector
<
int
>
strides_
;
std
::
vector
<
int
>
input_shape_
;
std
::
vector
<
size_t
>
input_size_list_
;
std
::
vector
<
size_t
>
output_size_list_
;
std
::
vector
<
size_t
>
workspace_size_list_
;
bool
is_strided_slice_
;
bool
is_null_input_
;
size_t
input_size_
;
size_t
output_size_
;
...
...
This diff is collapsed.
Click to expand it.
mindspore/ccsrc/runtime/device/gpu/kernel_info_setter.h
浏览文件 @
82ae946f
...
...
@@ -39,6 +39,7 @@ static std::map<std::string, std::pair<std::vector<size_t>, std::vector<size_t>>
{
prim
::
kPrimReluGrad
->
name
(),
{{
0
,
1
},
{
0
}}},
{
prim
::
kPrimMaxPool
->
name
(),
{{
0
},
{
0
}}},
{
prim
::
kPrimMaxPoolGrad
->
name
(),
{{
0
,
1
,
2
},
{
0
}}},
{
kSliceOpName
,
{{
0
},
{
0
}}},
{
kAvgPoolOpName
,
{{
0
},
{
0
}}},
{
kAvgPoolGradGpuOpName
,
{{
0
,
1
,
2
},
{
0
}}},
{
kTensorAddOpName
,
{{
0
,
1
},
{
0
}}},
...
...
This diff is collapsed.
Click to expand it.
编辑
预览
Markdown
is supported
0%
请重试
或
添加新附件
.
添加附件
取消
You are about to add
0
people
to the discussion. Proceed with caution.
先完成此消息的编辑!
取消
想要评论请
注册
或
登录
新手
引导
客服
返回
顶部