Skip to content
体验新版
项目
组织
正在加载...
登录
切换导航
打开侧边栏
机器未来
Paddle
提交
d7493df2
P
Paddle
项目概览
机器未来
/
Paddle
与 Fork 源项目一致
Fork自
PaddlePaddle / Paddle
通知
1
Star
1
Fork
0
代码
文件
提交
分支
Tags
贡献者
分支图
Diff
Issue
1
列表
看板
标记
里程碑
合并请求
0
Wiki
0
Wiki
分析
仓库
DevOps
项目成员
Pages
P
Paddle
项目概览
项目概览
详情
发布
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
Issue
1
Issue
1
列表
看板
标记
里程碑
合并请求
0
合并请求
0
Pages
分析
分析
仓库分析
DevOps
Wiki
0
Wiki
成员
成员
收起侧边栏
关闭侧边栏
动态
分支图
创建新Issue
提交
Issue看板
未验证
提交
d7493df2
编写于
8月 03, 2021
作者:
L
Li Min
提交者:
GitHub
8月 03, 2021
浏览文件
操作
浏览文件
下载
电子邮件补丁
差异文件
[NPU] Support npu op reciprocal and reciprocal grad (#34531)
上级
2d0f3d9b
变更
3
隐藏空白更改
内联
并排
Showing
3 changed file
with
128 addition
and
5 deletion
+128
-5
paddle/fluid/operators/activation_op_npu.cc
paddle/fluid/operators/activation_op_npu.cc
+48
-0
paddle/fluid/operators/mean_op_npu.cc
paddle/fluid/operators/mean_op_npu.cc
+2
-5
python/paddle/fluid/tests/unittests/npu/test_reciprocal_op_npu.py
...addle/fluid/tests/unittests/npu/test_reciprocal_op_npu.py
+78
-0
未找到文件。
paddle/fluid/operators/activation_op_npu.cc
浏览文件 @
d7493df2
...
...
@@ -397,6 +397,40 @@ class HardSigmoidGradNPUKernel : public framework::OpKernel<T> {
}
};
/// Forward kernel for the reciprocal operator on NPU.
///
/// Reads the input tensor "X", requests storage of element type T for the
/// output tensor "Out" on the execution place, and launches the NPU operator
/// named "Reciprocal" on the device context's stream.
template <typename DeviceContext, typename T>
class ReciprocalNPUKernel : public framework::OpKernel<T> {
 public:
  /// @param ctx Execution context supplying the tensors, the place and the
  ///            NPU device context.
  void Compute(const framework::ExecutionContext& ctx) const override {
    auto* input = ctx.Input<Tensor>("X");
    auto* output = ctx.Output<Tensor>("Out");

    // The output buffer has to exist before the operator is launched.
    output->mutable_data<T>(ctx.GetPlace());

    auto npu_stream =
        ctx.template device_context<paddle::platform::NPUDeviceContext>()
            .stream();

    // Single input, single output, no attributes.
    const NpuOpRunner reciprocal_runner("Reciprocal", {*input}, {*output}, {});
    reciprocal_runner.Run(npu_stream);
  }
};
/// Backward kernel for the reciprocal operator on NPU.
///
/// Feeds the forward output "Out" and its gradient to the NPU operator named
/// "ReciprocalGrad" and writes the result into the gradient of "X".
template <typename DeviceContext, typename T>
class ReciprocalGradNPUKernel : public framework::OpKernel<T> {
 public:
  /// @param ctx Execution context supplying the tensors, the place and the
  ///            NPU device context.
  void Compute(const framework::ExecutionContext& ctx) const override {
    auto* forward_out = ctx.Input<Tensor>("Out");
    auto* grad_out = ctx.Input<Tensor>(framework::GradVarName("Out"));
    auto* grad_x = ctx.Output<Tensor>(framework::GradVarName("X"));

    // The gradient buffer has to exist before the operator is launched.
    grad_x->mutable_data<T>(ctx.GetPlace());

    auto npu_stream =
        ctx.template device_context<paddle::platform::NPUDeviceContext>()
            .stream();

    // Input order is (Out, dOut); there are no attributes.
    const NpuOpRunner grad_runner("ReciprocalGrad", {*forward_out, *grad_out},
                                  {*grad_x}, {});
    grad_runner.Run(npu_stream);
  }
};
}
// namespace operators
}
// namespace paddle
...
...
@@ -483,3 +517,17 @@ REGISTER_OP_NPU_KERNEL(
ops
::
HardSigmoidGradNPUKernel
<
paddle
::
platform
::
NPUDeviceContext
,
float
>
,
ops
::
HardSigmoidGradNPUKernel
<
paddle
::
platform
::
NPUDeviceContext
,
paddle
::
platform
::
float16
>
);
// Registers ReciprocalNPUKernel for the `reciprocal` op, instantiated for the
// float, double and float16 element types.
REGISTER_OP_NPU_KERNEL(
    reciprocal,
    ops::ReciprocalNPUKernel<paddle::platform::NPUDeviceContext, float>,
    ops::ReciprocalNPUKernel<paddle::platform::NPUDeviceContext, double>,
    ops::ReciprocalNPUKernel<paddle::platform::NPUDeviceContext,
                             paddle::platform::float16>);
// Registers ReciprocalGradNPUKernel for the `reciprocal_grad` op, instantiated
// for the float, double and float16 element types.
REGISTER_OP_NPU_KERNEL(
    reciprocal_grad,
    ops::ReciprocalGradNPUKernel<paddle::platform::NPUDeviceContext, float>,
    ops::ReciprocalGradNPUKernel<paddle::platform::NPUDeviceContext, double>,
    ops::ReciprocalGradNPUKernel<paddle::platform::NPUDeviceContext,
                                 paddle::platform::float16>);
paddle/fluid/operators/mean_op_npu.cc
浏览文件 @
d7493df2
...
...
@@ -91,13 +91,10 @@ class MeanGradNPUKernel : public framework::OpKernel<T> {
namespace
ops
=
paddle
::
operators
;
namespace
plat
=
paddle
::
platform
;
// Registration of MeanNPUKernel for the `mean` op.
// NOTE(review): this text appears to come from a rendered diff in which
// removed and added lines were merged without +/- markers; the op name `mean`
// shows up twice in the argument list. Presumably only one of the two
// `mean, ...` runs belongs to the final file -- confirm against the repository
// before relying on this list of element types.
REGISTER_OP_NPU_KERNEL(
    mean, ops::MeanNPUKernel<paddle::platform::NPUDeviceContext, int>,
    ops::MeanNPUKernel<paddle::platform::NPUDeviceContext, float>,
    ops::MeanNPUKernel<paddle::platform::NPUDeviceContext, double>,
    mean, ops::MeanNPUKernel<paddle::platform::NPUDeviceContext, float>,
    ops::MeanNPUKernel<paddle::platform::NPUDeviceContext, plat::float16>)
// Registration of MeanGradNPUKernel for the `mean_grad` op.
// NOTE(review): this text appears to come from a rendered diff in which
// removed and added lines were merged without +/- markers; the op name
// `mean_grad` shows up twice in the argument list. Presumably only one of the
// two `mean_grad, ...` runs belongs to the final file -- confirm against the
// repository before relying on this list of element types.
REGISTER_OP_NPU_KERNEL(
    mean_grad, ops::MeanGradNPUKernel<paddle::platform::NPUDeviceContext, int>,
    mean_grad, ops::MeanGradNPUKernel<paddle::platform::NPUDeviceContext, float>,
    ops::MeanGradNPUKernel<paddle::platform::NPUDeviceContext, double>,
    ops::MeanGradNPUKernel<paddle::platform::NPUDeviceContext, plat::float16>)
python/paddle/fluid/tests/unittests/npu/test_reciprocal_op_npu.py
0 → 100644
浏览文件 @
d7493df2
# Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
from
__future__
import
print_function
,
division
import
numpy
as
np
import
unittest
import
sys
sys
.
path
.
append
(
".."
)
from
op_test
import
OpTest
,
skip_check_grad_ci
import
paddle
paddle
.
enable_static
()
class TestNPUReciprocal(OpTest):
    """Checks the `reciprocal` op on NPU place 0 using float32 data.

    Subclasses override `init_dtype` (and optionally `set_npu`) to run the
    same checks with another element type.
    """

    def set_npu(self):
        # Flag the test class as an NPU test and select device 0.
        type(self).use_npu = True
        self.place = paddle.NPUPlace(0)

    def init_dtype(self):
        # Element type of the generated input data.
        self.dtype = np.float32

    def setUp(self):
        self.op_type = "reciprocal"
        self.set_npu()
        self.init_dtype()

        # Fixed seed keeps the generated data reproducible; values are drawn
        # from [1, 2), so no element is zero.
        np.random.seed(1024)
        sample = np.random.uniform(1, 2, [11, 17]).astype(self.dtype)
        expected = np.reciprocal(sample)

        self.inputs = {'X': OpTest.np_dtype_to_fluid_dtype(sample)}
        self.outputs = {'Out': expected}

    def test_check_output(self):
        self.check_output_with_place(self.place)

    def test_check_grad(self):
        # The gradient check is only run for non-float16 data.
        if self.dtype != np.float16:
            self.check_grad_with_place(
                self.place, ['X'], 'Out', max_relative_error=0.01)
class TestNPUReciprocalFp64(TestNPUReciprocal):
    """Runs the reciprocal checks with float64 input data."""

    def init_dtype(self):
        self.dtype = np.float64

    def set_npu(self):
        # Flag the test class as an NPU test and select device 0.
        type(self).use_npu = True
        self.place = paddle.NPUPlace(0)
@skip_check_grad_ci(
    reason="The backward test is not supported for float16 type on NPU.")
class TestNPUReciprocalFp16(TestNPUReciprocal):
    """Runs the reciprocal output check with float16 input data."""

    def init_dtype(self):
        self.dtype = np.float16

    def set_npu(self):
        # Flag the test class as an NPU test, select device 0, and mark the
        # class as not needing a gradient check.
        test_cls = type(self)
        test_cls.use_npu = True
        self.place = paddle.NPUPlace(0)
        test_cls.no_need_check_grad = True
# Run the test cases of this module when it is executed as a script.
if __name__ == '__main__':
    unittest.main()
编辑
预览
Markdown
is supported
0%
请重试
或
添加新附件
.
添加附件
取消
You are about to add
0
people
to the discussion. Proceed with caution.
先完成此消息的编辑!
取消
想要评论请
注册
或
登录