Skip to content
体验新版
项目
组织
正在加载...
登录
切换导航
打开侧边栏
PaddlePaddle
Paddle
提交
fe8c6796
P
Paddle
项目概览
PaddlePaddle
/
Paddle
1 年多 前同步成功
通知
2305
Star
20932
Fork
5423
代码
文件
提交
分支
Tags
贡献者
分支图
Diff
Issue
1423
列表
看板
标记
里程碑
合并请求
543
Wiki
0
Wiki
分析
仓库
DevOps
项目成员
Pages
P
Paddle
项目概览
项目概览
详情
发布
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
Issue
1,423
Issue
1,423
列表
看板
标记
里程碑
合并请求
543
合并请求
543
Pages
分析
分析
仓库分析
DevOps
Wiki
0
Wiki
成员
成员
收起侧边栏
关闭侧边栏
动态
分支图
创建新Issue
提交
Issue看板
未验证
提交
fe8c6796
编写于
11月 02, 2022
作者:
Y
YuanRisheng
提交者:
GitHub
11月 02, 2022
浏览文件
操作
浏览文件
下载
电子邮件补丁
差异文件
[PHI]Standardise some C++ API (Part3) (#47532)
* Standardise batch norm * standardize conv3d and depwise_conv2d * fix ci bugs
上级
cad2e68d
变更
52
隐藏空白更改
内联
并排
Showing
52 changed file
with
217 addition
and
361 deletion
+217
-361
paddle/fluid/operators/inplace_abn_op.cc
paddle/fluid/operators/inplace_abn_op.cc
+3
-7
paddle/fluid/operators/inplace_abn_op.cu
paddle/fluid/operators/inplace_abn_op.cu
+6
-11
paddle/phi/api/yaml/legacy_backward.yaml
paddle/phi/api/yaml/legacy_backward.yaml
+36
-36
paddle/phi/api/yaml/legacy_ops.yaml
paddle/phi/api/yaml/legacy_ops.yaml
+6
-6
paddle/phi/api/yaml/sparse_backward.yaml
paddle/phi/api/yaml/sparse_backward.yaml
+4
-4
paddle/phi/api/yaml/sparse_ops.yaml
paddle/phi/api/yaml/sparse_ops.yaml
+2
-2
paddle/phi/infermeta/binary.cc
paddle/phi/infermeta/binary.cc
+0
-6
paddle/phi/infermeta/binary.h
paddle/phi/infermeta/binary.h
+0
-6
paddle/phi/infermeta/multiary.cc
paddle/phi/infermeta/multiary.cc
+8
-10
paddle/phi/infermeta/multiary.h
paddle/phi/infermeta/multiary.h
+5
-6
paddle/phi/kernels/batch_norm_grad_kernel.h
paddle/phi/kernels/batch_norm_grad_kernel.h
+0
-3
paddle/phi/kernels/batch_norm_kernel.cc
paddle/phi/kernels/batch_norm_kernel.cc
+5
-6
paddle/phi/kernels/batch_norm_kernel.h
paddle/phi/kernels/batch_norm_kernel.h
+5
-6
paddle/phi/kernels/conv_grad_kernel.h
paddle/phi/kernels/conv_grad_kernel.h
+16
-25
paddle/phi/kernels/conv_kernel.h
paddle/phi/kernels/conv_kernel.h
+0
-7
paddle/phi/kernels/cpu/batch_norm_grad_kernel.cc
paddle/phi/kernels/cpu/batch_norm_grad_kernel.cc
+0
-4
paddle/phi/kernels/cpu/batch_norm_kernel.cc
paddle/phi/kernels/cpu/batch_norm_kernel.cc
+3
-4
paddle/phi/kernels/cpu/conv_grad_kernel.cc
paddle/phi/kernels/cpu/conv_grad_kernel.cc
+18
-27
paddle/phi/kernels/cpu/conv_kernel.cc
paddle/phi/kernels/cpu/conv_kernel.cc
+0
-7
paddle/phi/kernels/gpu/batch_norm_grad_kernel.cu
paddle/phi/kernels/gpu/batch_norm_grad_kernel.cu
+0
-4
paddle/phi/kernels/gpu/batch_norm_kernel.cu
paddle/phi/kernels/gpu/batch_norm_kernel.cu
+3
-4
paddle/phi/kernels/gpu/conv_grad_kernel.cu
paddle/phi/kernels/gpu/conv_grad_kernel.cu
+0
-3
paddle/phi/kernels/gpu/conv_kernel.cu
paddle/phi/kernels/gpu/conv_kernel.cu
+0
-3
paddle/phi/kernels/gpu/depthwise_conv_grad_kernel.cu
paddle/phi/kernels/gpu/depthwise_conv_grad_kernel.cu
+7
-4
paddle/phi/kernels/gpu/depthwise_conv_kernel.cu
paddle/phi/kernels/gpu/depthwise_conv_kernel.cu
+8
-4
paddle/phi/kernels/gpu/sync_batch_norm_grad_kernel.cu
paddle/phi/kernels/gpu/sync_batch_norm_grad_kernel.cu
+0
-1
paddle/phi/kernels/gpu/sync_batch_norm_kernel.cu
paddle/phi/kernels/gpu/sync_batch_norm_kernel.cu
+3
-4
paddle/phi/kernels/gpudnn/conv_grad_kernel.cu
paddle/phi/kernels/gpudnn/conv_grad_kernel.cu
+10
-20
paddle/phi/kernels/gpudnn/conv_kernel.cu
paddle/phi/kernels/gpudnn/conv_kernel.cu
+0
-7
paddle/phi/kernels/sparse/batch_norm_grad_kernel.cc
paddle/phi/kernels/sparse/batch_norm_grad_kernel.cc
+0
-2
paddle/phi/kernels/sparse/batch_norm_grad_kernel.h
paddle/phi/kernels/sparse/batch_norm_grad_kernel.h
+0
-1
paddle/phi/kernels/sparse/batch_norm_kernel.cc
paddle/phi/kernels/sparse/batch_norm_kernel.cc
+6
-8
paddle/phi/kernels/sparse/batch_norm_kernel.h
paddle/phi/kernels/sparse/batch_norm_kernel.h
+0
-1
paddle/phi/kernels/sparse/gpu/sync_batch_norm_grad_kernel.cu
paddle/phi/kernels/sparse/gpu/sync_batch_norm_grad_kernel.cu
+0
-2
paddle/phi/kernels/sparse/gpu/sync_batch_norm_kernel.cu
paddle/phi/kernels/sparse/gpu/sync_batch_norm_kernel.cu
+6
-8
paddle/phi/kernels/sparse/sync_batch_norm_grad_kernel.h
paddle/phi/kernels/sparse/sync_batch_norm_grad_kernel.h
+0
-1
paddle/phi/kernels/sparse/sync_batch_norm_kernel.h
paddle/phi/kernels/sparse/sync_batch_norm_kernel.h
+3
-4
paddle/phi/kernels/sync_batch_norm_grad_kernel.h
paddle/phi/kernels/sync_batch_norm_grad_kernel.h
+0
-1
paddle/phi/kernels/sync_batch_norm_kernel.h
paddle/phi/kernels/sync_batch_norm_kernel.h
+3
-4
paddle/phi/kernels/xpu/batch_norm_grad_kernel.cc
paddle/phi/kernels/xpu/batch_norm_grad_kernel.cc
+0
-1
paddle/phi/kernels/xpu/batch_norm_kernel.cc
paddle/phi/kernels/xpu/batch_norm_kernel.cc
+4
-5
paddle/phi/kernels/xpu/conv_grad_kernel.cc
paddle/phi/kernels/xpu/conv_grad_kernel.cc
+0
-4
paddle/phi/kernels/xpu/conv_kernel.cc
paddle/phi/kernels/xpu/conv_kernel.cc
+0
-4
paddle/phi/ops/compat/batch_norm_sig.cc
paddle/phi/ops/compat/batch_norm_sig.cc
+7
-10
paddle/phi/ops/compat/conv3d_sig.cc
paddle/phi/ops/compat/conv3d_sig.cc
+13
-18
paddle/phi/ops/compat/depthwise_conv2d_sig.cc
paddle/phi/ops/compat/depthwise_conv2d_sig.cc
+7
-16
paddle/phi/ops/compat/sync_batch_norm_sig.cc
paddle/phi/ops/compat/sync_batch_norm_sig.cc
+5
-7
python/paddle/fluid/dygraph/nn.py
python/paddle/fluid/dygraph/nn.py
+3
-4
python/paddle/nn/functional/conv.py
python/paddle/nn/functional/conv.py
+0
-7
python/paddle/nn/functional/norm.py
python/paddle/nn/functional/norm.py
+3
-4
python/paddle/nn/layer/norm.py
python/paddle/nn/layer/norm.py
+3
-4
python/paddle/sparse/nn/layer/norm.py
python/paddle/sparse/nn/layer/norm.py
+6
-8
未找到文件。
paddle/fluid/operators/inplace_abn_op.cc
浏览文件 @
fe8c6796
...
...
@@ -242,7 +242,6 @@ class InplaceABNKernel : public framework::OpKernel<T> {
auto
is_test
=
ctx
.
Attr
<
bool
>
(
"is_test"
);
auto
use_global_stats
=
ctx
.
Attr
<
bool
>
(
"use_global_stats"
);
auto
trainable_statistics
=
ctx
.
Attr
<
bool
>
(
"trainable_statistics"
);
auto
fuse_with_relu
=
ctx
.
Attr
<
bool
>
(
"fuse_with_relu"
);
auto
*
mean_out
=
ctx
.
Output
<
phi
::
DenseTensor
>
(
"MeanOut"
);
auto
*
variance_out
=
ctx
.
Output
<
phi
::
DenseTensor
>
(
"VarianceOut"
);
...
...
@@ -255,17 +254,16 @@ class InplaceABNKernel : public framework::OpKernel<T> {
static_cast
<
const
typename
framework
::
ConvertToPhiContext
<
DeviceContext
>::
TYPE
&>
(
dev_ctx
),
*
x
,
*
scale
,
*
bias
,
*
mean
,
*
variance
,
*
scale
,
*
bias
,
is_test
,
momentum
,
epsilon
,
data_layout
,
is_test
,
use_global_stats
,
trainable_statistics
,
fuse_with_relu
,
y
,
mean_out
,
variance_out
,
...
...
@@ -315,7 +313,6 @@ class InplaceABNGradKernel : public framework::OpKernel<T> {
auto
is_test
=
ctx
.
Attr
<
bool
>
(
"is_test"
);
auto
use_global_stats
=
ctx
.
Attr
<
bool
>
(
"use_global_stats"
);
auto
trainable_statistics
=
ctx
.
Attr
<
bool
>
(
"trainable_statistics"
);
auto
fuse_with_relu
=
ctx
.
Attr
<
bool
>
(
"fuse_with_relu"
);
auto
*
scale_grad
=
ctx
.
Output
<
phi
::
DenseTensor
>
(
framework
::
GradVarName
(
"Scale"
));
...
...
@@ -361,7 +358,6 @@ class InplaceABNGradKernel : public framework::OpKernel<T> {
is_test
,
use_global_stats
,
trainable_statistics
,
fuse_with_relu
,
true
,
d_x
,
scale_grad
,
...
...
paddle/fluid/operators/inplace_abn_op.cu
浏览文件 @
fe8c6796
...
...
@@ -48,7 +48,6 @@ class InplaceABNKernel : public framework::OpKernel<T> {
auto
is_test
=
ctx
.
Attr
<
bool
>
(
"is_test"
);
auto
use_global_stats
=
ctx
.
Attr
<
bool
>
(
"use_global_stats"
);
auto
trainable_statistics
=
ctx
.
Attr
<
bool
>
(
"trainable_statistics"
);
auto
fuse_with_relu
=
ctx
.
Attr
<
bool
>
(
"fuse_with_relu"
);
auto
*
mean_out
=
ctx
.
Output
<
phi
::
DenseTensor
>
(
"MeanOut"
);
auto
*
variance_out
=
ctx
.
Output
<
phi
::
DenseTensor
>
(
"VarianceOut"
);
...
...
@@ -62,17 +61,16 @@ class InplaceABNKernel : public framework::OpKernel<T> {
static_cast
<
const
typename
framework
::
ConvertToPhiContext
<
DeviceContext
>::
TYPE
&>
(
dev_ctx
),
*
x
,
*
scale
,
*
bias
,
*
mean
,
*
variance
,
*
scale
,
*
bias
,
is_test
,
momentum
,
epsilon
,
data_layout
,
is_test
,
use_global_stats
,
trainable_statistics
,
fuse_with_relu
,
y
,
mean_out
,
variance_out
,
...
...
@@ -85,17 +83,16 @@ class InplaceABNKernel : public framework::OpKernel<T> {
static_cast
<
const
typename
framework
::
ConvertToPhiContext
<
DeviceContext
>::
TYPE
&>
(
dev_ctx
),
*
x
,
*
scale
,
*
bias
,
*
mean
,
*
variance
,
*
scale
,
*
bias
,
is_test
,
momentum
,
epsilon
,
data_layout
,
is_test
,
use_global_stats
,
trainable_statistics
,
fuse_with_relu
,
y
,
mean_out
,
variance_out
,
...
...
@@ -146,7 +143,6 @@ class InplaceABNGradKernel : public framework::OpKernel<T> {
auto
is_test
=
ctx
.
Attr
<
bool
>
(
"is_test"
);
auto
use_global_stats
=
ctx
.
Attr
<
bool
>
(
"use_global_stats"
);
auto
trainable_statistics
=
ctx
.
Attr
<
bool
>
(
"trainable_statistics"
);
auto
fuse_with_relu
=
ctx
.
Attr
<
bool
>
(
"fuse_with_relu"
);
auto
*
scale_grad
=
ctx
.
Output
<
phi
::
DenseTensor
>
(
framework
::
GradVarName
(
"Scale"
));
...
...
@@ -210,7 +206,6 @@ class InplaceABNGradKernel : public framework::OpKernel<T> {
is_test
,
use_global_stats
,
trainable_statistics
,
fuse_with_relu
,
true
,
d_x
,
scale_grad
,
...
...
paddle/phi/api/yaml/legacy_backward.yaml
浏览文件 @
fe8c6796
...
...
@@ -129,8 +129,8 @@
inplace
:
(out_grad -> x_grad)
-
backward_op
:
batch_norm_double_grad
forward
:
batch_norm_grad (Tensor x, Tensor scale, Tensor bias, Tensor out_mean, Tensor out_variance, Tensor saved_mean, Tensor saved_variance, Tensor reserve_space, Tensor grad_out, float momentum, float epsilon, str data_layout, bool is_test, bool use_global_stats, bool trainable_statistics
, bool fuse_with_relu
) -> Tensor(grad_x), Tensor(grad_scale), Tensor(grad_bias)
args
:
(Tensor x, Tensor scale, Tensor out_mean, Tensor out_variance, Tensor saved_mean, Tensor saved_variance, Tensor grad_out, Tensor grad_x_grad, Tensor grad_scale_grad, Tensor grad_bias_grad, float momentum, float epsilon, str data_layout, bool is_test, bool use_global_stats, bool trainable_statistics
, bool fuse_with_relu
)
forward
:
batch_norm_grad (Tensor x, Tensor scale, Tensor bias, Tensor out_mean, Tensor out_variance, Tensor saved_mean, Tensor saved_variance, Tensor reserve_space, Tensor grad_out, float momentum, float epsilon, str data_layout, bool is_test, bool use_global_stats, bool trainable_statistics) -> Tensor(grad_x), Tensor(grad_scale), Tensor(grad_bias)
args
:
(Tensor x, Tensor scale, Tensor out_mean, Tensor out_variance, Tensor saved_mean, Tensor saved_variance, Tensor grad_out, Tensor grad_x_grad, Tensor grad_scale_grad, Tensor grad_bias_grad, float momentum, float epsilon, str data_layout, bool is_test, bool use_global_stats, bool trainable_statistics)
output
:
Tensor(x_grad), Tensor(scale_grad), Tensor(grad_out_grad)
infer_meta
:
func
:
GeneralTernaryGradInferMeta
...
...
@@ -142,8 +142,8 @@
inplace
:
(grad_out -> grad_out_grad)
-
backward_op
:
batch_norm_grad
forward
:
batch_norm (Tensor x, Tensor
scale, Tensor bias, Tensor mean, Tensor variance, float momentum, float epsilon, str data_layout, bool is_test, bool use_global_stats, bool trainable_statistics, bool fuse_with_relu
) -> Tensor(out), Tensor(mean_out), Tensor(variance_out), Tensor(saved_mean), Tensor(saved_variance), Tensor(reserve_space)
args
:
(Tensor x, Tensor scale, Tensor bias, Tensor mean_out, Tensor variance_out, Tensor saved_mean, Tensor saved_variance, Tensor reserve_space, Tensor out_grad, float momentum, float epsilon, str data_layout, bool is_test, bool use_global_stats, bool trainable_statistics
, bool fuse_with_relu
)
forward
:
batch_norm (Tensor x, Tensor
mean, Tensor variance, Tensor scale, Tensor bias, bool is_test, float momentum, float epsilon, str data_layout, bool use_global_stats, bool trainable_statistics
) -> Tensor(out), Tensor(mean_out), Tensor(variance_out), Tensor(saved_mean), Tensor(saved_variance), Tensor(reserve_space)
args
:
(Tensor x, Tensor scale, Tensor bias, Tensor mean_out, Tensor variance_out, Tensor saved_mean, Tensor saved_variance, Tensor reserve_space, Tensor out_grad, float momentum, float epsilon, str data_layout, bool is_test, bool use_global_stats, bool trainable_statistics)
output
:
Tensor(x_grad), Tensor(scale_grad), Tensor(bias_grad)
infer_meta
:
func
:
GeneralTernaryGradInferMeta
...
...
@@ -345,9 +345,21 @@
use_gpudnn
:
true
backward
:
conv2d_transpose_double_grad
-
backward_op
:
conv3d_double_grad
forward
:
conv3d_grad (Tensor input, Tensor filter, Tensor grad_out, int[] strides, int[] paddings, str padding_algorithm, int groups, int[] dilations, str data_format) -> Tensor(grad_input), Tensor(grad_filter)
args
:
(Tensor input, Tensor filter, Tensor grad_out, Tensor grad_input_grad, Tensor grad_filter_grad, int[] strides, int[] paddings, str padding_algorithm, int groups, int[] dilations, str data_format)
output
:
Tensor(input_grad), Tensor(filter_grad), Tensor(grad_out_grad)
infer_meta
:
func
:
GeneralTernaryGradInferMeta
param
:
[
input
,
filter
,
grad_out
]
kernel
:
func
:
conv3d_double_grad
use_gpudnn
:
true
optional
:
grad_input_grad, grad_filter_grad
-
backward_op
:
conv3d_grad
forward
:
conv3d (Tensor input, Tensor filter, int[] strides, int[] paddings, str padding_algorithm, int groups, int[] dilations, str data_format
, bool use_addto, int workspace_size_MB, bool exhaustive_search
) -> Tensor(out)
args
:
(Tensor input, Tensor filter, Tensor out_grad, int[] strides, int[] paddings, str padding_algorithm, int groups, int[] dilations, str data_format
, bool use_addto, int workspace_size_MB, bool exhaustive_search
)
forward
:
conv3d (Tensor input, Tensor filter, int[] strides, int[] paddings, str padding_algorithm, int groups, int[] dilations, str data_format) -> Tensor(out)
args
:
(Tensor input, Tensor filter, Tensor out_grad, int[] strides, int[] paddings, str padding_algorithm, int groups, int[] dilations, str data_format)
output
:
Tensor(input_grad), Tensor(filter_grad)
infer_meta
:
func
:
GeneralBinaryGradInferMeta
...
...
@@ -355,19 +367,7 @@
kernel
:
func
:
conv3d_grad
use_gpudnn
:
true
backward
:
conv3d_grad_grad
-
backward_op
:
conv3d_grad_grad
forward
:
conv3d_grad (Tensor input, Tensor filter, Tensor grad_out, int[] strides, int[] paddings, str padding_algorithm, int groups, int[] dilations, str data_format, bool use_addto, int workspace_size_MB, bool exhaustive_search) -> Tensor(grad_input), Tensor(grad_filter)
args
:
(Tensor input, Tensor filter, Tensor grad_out, Tensor grad_input_grad, Tensor grad_filter_grad, int[] strides, int[] paddings, str padding_algorithm, int groups, int[] dilations, str data_format, bool use_addto, int workspace_size_MB, bool exhaustive_search)
output
:
Tensor(input_grad), Tensor(filter_grad), Tensor(grad_out_grad)
infer_meta
:
func
:
GeneralTernaryGradInferMeta
param
:
[
input
,
filter
,
grad_out
]
kernel
:
func
:
conv3d_grad_grad
use_gpudnn
:
true
optional
:
grad_input_grad, grad_filter_grad
backward
:
conv3d_double_grad
-
backward_op
:
conv3d_transpose_grad
forward
:
conv3d_transpose(Tensor x, Tensor filter, int[] strides, int[] paddings, int[] output_padding, int[] output_size, str padding_algorithm, int groups, int[] dilations, str data_format) -> Tensor(out)
...
...
@@ -427,29 +427,29 @@
data_type
:
x
optional
:
mask
-
backward_op
:
depthwise_conv2d_double_grad
forward
:
depthwise_conv2d_grad (Tensor input, Tensor filter, Tensor grad_out, int[] strides, int[] paddings, str padding_algorithm, int groups, int[] dilations, str data_format, bool use_gpudnn) -> Tensor(grad_input), Tensor(grad_filter)
args
:
(Tensor input, Tensor filter, Tensor grad_out, Tensor grad_input_grad, Tensor grad_filter_grad, int[] strides, int[] paddings, str padding_algorithm, int groups, int[] dilations, str data_format)
output
:
Tensor(input_grad), Tensor(filter_grad), Tensor(grad_out_grad)
infer_meta
:
func
:
GeneralTernaryGradInferMeta
param
:
[
input
,
filter
,
grad_out
]
kernel
:
func
:
depthwise_conv2d_double_grad
optional
:
grad_input_grad, grad_filter_grad
-
backward_op
:
depthwise_conv2d_grad
forward
:
depthwise_conv2d (Tensor input, Tensor filter, int[] strides, int[] paddings, str padding_algorithm, int groups, int[] dilations, str data_format, bool use_
addto, int workspace_size_MB, bool exhaustive_search, bool fuse_relu, bool use_
gpudnn) -> Tensor(out)
args
:
(Tensor input, Tensor filter, Tensor out_grad, int[] strides, int[] paddings, str padding_algorithm, int groups, int[] dilations, str data_format, bool use_
addto, int workspace_size_MB, bool exhaustive_search, bool fuse_relu, bool use_
gpudnn)
forward
:
depthwise_conv2d (Tensor input, Tensor filter, int[] strides, int[] paddings, str padding_algorithm, int groups, int[] dilations, str data_format, bool use_gpudnn) -> Tensor(out)
args
:
(Tensor input, Tensor filter, Tensor out_grad, int[] strides, int[] paddings, str padding_algorithm, int groups, int[] dilations, str data_format, bool use_gpudnn)
output
:
Tensor(input_grad), Tensor(filter_grad)
infer_meta
:
func
:
GeneralBinaryGradInferMeta
param
:
[
input
,
filter
]
kernel
:
func
:
depthwise_conv2d_grad
param
:
[
input
,
filter
,
out_grad
,
strides
,
paddings
,
padding_algorithm
,
groups
,
dilations
,
data_format
,
use_addto
,
workspace_size_MB
,
exhaustive_search
,
fuse_relu
]
param
:
[
input
,
filter
,
out_grad
,
strides
,
paddings
,
padding_algorithm
,
groups
,
dilations
,
data_format
]
use_gpudnn
:
use_gpudnn
backward
:
depthwise_conv2d_grad_grad
-
backward_op
:
depthwise_conv2d_grad_grad
forward
:
depthwise_conv2d_grad (Tensor input, Tensor filter, Tensor grad_out, int[] strides, int[] paddings, str padding_algorithm, int groups, int[] dilations, str data_format, bool use_addto, int workspace_size_MB, bool exhaustive_search, bool fuse_relu, bool use_gpudnn) -> Tensor(grad_input), Tensor(grad_filter)
args
:
(Tensor input, Tensor filter, Tensor grad_out, Tensor grad_input_grad, Tensor grad_filter_grad, int[] strides, int[] paddings, str padding_algorithm, int groups, int[] dilations, str data_format, bool use_addto, int workspace_size_MB, bool exhaustive_search, bool fuse_relu)
output
:
Tensor(input_grad), Tensor(filter_grad), Tensor(grad_out_grad)
infer_meta
:
func
:
GeneralTernaryGradInferMeta
param
:
[
input
,
filter
,
grad_out
]
kernel
:
func
:
depthwise_conv2d_grad_grad
optional
:
grad_input_grad, grad_filter_grad
backward
:
depthwise_conv2d_double_grad
-
backward_op
:
depthwise_conv2d_transpose_grad
forward
:
depthwise_conv2d_transpose(Tensor x, Tensor filter, int[] strides, int[] paddings, int[] output_padding, IntArray output_size, str padding_algorithm, int groups, int[] dilations, str data_format) -> Tensor(out)
...
...
@@ -2091,8 +2091,8 @@
inplace
:
(out_grad -> x_grad)
-
backward_op
:
sync_batch_norm_grad
forward
:
sync_batch_norm_ (Tensor x, Tensor
scale, Tensor bias, Tensor mean, Tensor variance, float momentum, float epsilon, str data_layout, bool is_test, bool use_global_stats, bool trainable_statistics, bool fuse_with_relu
) -> Tensor(out), Tensor(mean_out), Tensor(variance_out), Tensor(saved_mean), Tensor(saved_variance), Tensor(reserve_space)
args
:
(Tensor x, Tensor scale, Tensor bias, Tensor saved_mean, Tensor saved_variance, Tensor reserve_space, Tensor out_grad, float momentum, float epsilon, str data_layout, bool is_test, bool use_global_stats, bool trainable_statistics
, bool fuse_with_relu
)
forward
:
sync_batch_norm_ (Tensor x, Tensor
mean, Tensor variance, Tensor scale, Tensor bias, bool is_test, float momentum, float epsilon, str data_layout, bool use_global_stats, bool trainable_statistics
) -> Tensor(out), Tensor(mean_out), Tensor(variance_out), Tensor(saved_mean), Tensor(saved_variance), Tensor(reserve_space)
args
:
(Tensor x, Tensor scale, Tensor bias, Tensor saved_mean, Tensor saved_variance, Tensor reserve_space, Tensor out_grad, float momentum, float epsilon, str data_layout, bool is_test, bool use_global_stats, bool trainable_statistics)
output
:
Tensor(x_grad), Tensor(scale_grad), Tensor(bias_grad)
infer_meta
:
func
:
GeneralTernaryGradInferMeta
...
...
paddle/phi/api/yaml/legacy_ops.yaml
浏览文件 @
fe8c6796
...
...
@@ -254,7 +254,7 @@
inplace
:
(in_sum_1 -> out_sum_1), (in_sum_2 -> out_sum_2), (in_sum_3 -> out_sum_3), (in_num_accumulates -> out_num_accumulates), (in_old_num_accumulates -> out_old_num_accumulates), (in_num_updates -> out_num_updates)
-
op
:
batch_norm
args
:
(Tensor x, Tensor
scale, Tensor bias, Tensor mean, Tensor variance, float momentum, float epsilon, str data_layout, bool is_test, bool use_global_stats, bool trainable_statistics, bool fuse_with_relu
)
args
:
(Tensor x, Tensor
mean, Tensor variance, Tensor scale, Tensor bias, bool is_test, float momentum, float epsilon, str data_layout, bool use_global_stats, bool trainable_statistics
)
output
:
Tensor(out), Tensor(mean_out), Tensor(variance_out), Tensor(saved_mean), Tensor(saved_variance), Tensor(reserve_space)
infer_meta
:
func
:
BatchNormInferMeta
...
...
@@ -464,7 +464,7 @@
backward
:
conv2d_transpose_grad
-
op
:
conv3d
args
:
(Tensor input, Tensor filter, int[] strides, int[] paddings, str padding_algorithm, int groups, int[] dilations, str data_format
, bool use_addto, int workspace_size_MB, bool exhaustive_search
)
args
:
(Tensor input, Tensor filter, int[] strides, int[] paddings, str padding_algorithm, int groups, int[] dilations, str data_format)
output
:
Tensor
infer_meta
:
func
:
Conv3DInferMeta
...
...
@@ -551,14 +551,14 @@
backward
:
deformable_conv_grad
-
op
:
depthwise_conv2d
args
:
(Tensor x, Tensor filter, int[] strides, int[] paddings, str padding_algorithm, int groups, int[] dilations, str data_format, bool use_
addto, int workspace_size_MB, bool exhaustive_search, bool fuse_relu, bool use_
gpudnn)
args
:
(Tensor x, Tensor filter, int[] strides, int[] paddings, str padding_algorithm, int groups, int[] dilations, str data_format, bool use_gpudnn)
output
:
Tensor(out)
infer_meta
:
func
:
DepthwiseConvInferMeta
param
:
[
x
,
filter
,
strides
,
paddings
,
padding_algorithm
,
groups
,
dilations
,
data_format
,
use_addto
,
workspace_size_MB
,
exhaustive_search
]
param
:
[
x
,
filter
,
strides
,
paddings
,
padding_algorithm
,
groups
,
dilations
,
data_format
]
kernel
:
func
:
depthwise_conv2d
param
:
[
x
,
filter
,
strides
,
paddings
,
padding_algorithm
,
groups
,
dilations
,
data_format
,
use_addto
,
workspace_size_MB
,
exhaustive_search
,
fuse_relu
]
param
:
[
x
,
filter
,
strides
,
paddings
,
padding_algorithm
,
groups
,
dilations
,
data_format
]
use_gpudnn
:
use_gpudnn
backward
:
depthwise_conv2d_grad
...
...
@@ -2373,7 +2373,7 @@
backward
:
swish_grad
-
op
:
sync_batch_norm_
args
:
(Tensor x, Tensor
scale, Tensor bias, Tensor mean, Tensor variance, float momentum, float epsilon, str data_layout, bool is_test, bool use_global_stats, bool trainable_statistics, bool fuse_with_relu
)
args
:
(Tensor x, Tensor
mean, Tensor variance, Tensor scale, Tensor bias, bool is_test, float momentum, float epsilon, str data_layout, bool use_global_stats, bool trainable_statistics
)
output
:
Tensor(out), Tensor(mean_out), Tensor(variance_out), Tensor(saved_mean), Tensor(saved_variance), Tensor(reserve_space)
infer_meta
:
func
:
BatchNormInferMeta
...
...
paddle/phi/api/yaml/sparse_backward.yaml
浏览文件 @
fe8c6796
...
...
@@ -101,8 +101,8 @@
atanh_csr_grad {sparse_csr, sparse_csr -> sparse_csr}
-
backward_op
:
batch_norm_grad
forward
:
batch_norm (Tensor x, Tensor
scale, Tensor bias, Tensor mean, Tensor variance, float momentum, float epsilon, str data_layout, bool is_test, bool use_global_stats, bool trainable_statistics, bool fuse_with_relu
) -> Tensor(out), Tensor(mean_out), Tensor(variance_out), Tensor(saved_mean), Tensor(saved_variance), Tensor(reserve_space)
args
:
(Tensor x, Tensor scale, Tensor bias, Tensor mean_out, Tensor variance_out, Tensor saved_mean, Tensor saved_variance, Tensor reserve_space, Tensor out_grad, float momentum, float epsilon, str data_layout, bool is_test, bool use_global_stats, bool trainable_statistics
, bool fuse_with_relu
)
forward
:
batch_norm (Tensor x, Tensor
mean, Tensor variance, Tensor scale, Tensor bias, bool is_test, float momentum, float epsilon, str data_layout, bool use_global_stats, bool trainable_statistics
) -> Tensor(out), Tensor(mean_out), Tensor(variance_out), Tensor(saved_mean), Tensor(saved_variance), Tensor(reserve_space)
args
:
(Tensor x, Tensor scale, Tensor bias, Tensor mean_out, Tensor variance_out, Tensor saved_mean, Tensor saved_variance, Tensor reserve_space, Tensor out_grad, float momentum, float epsilon, str data_layout, bool is_test, bool use_global_stats, bool trainable_statistics)
output
:
Tensor(x_grad), Tensor(scale_grad), Tensor(bias_grad)
infer_meta
:
func
:
GeneralTernaryGradInferMeta
...
...
@@ -368,8 +368,8 @@
subtract_csr_csr_grad{sparse_csr, sparse_csr, sparse_csr -> sparse_csr, sparse_csr}
-
backward_op
:
sync_batch_norm_grad
forward
:
sync_batch_norm_(Tensor x, Tensor
scale, Tensor bias, Tensor mean, Tensor variance, float momentum, float epsilon, str data_layout, bool is_test, bool use_global_stats, bool trainable_statistics, bool fuse_with_relu
) -> Tensor(out), Tensor(mean_out), Tensor(variance_out), Tensor(saved_mean), Tensor(saved_variance), Tensor(reserve_space)
args
:
(Tensor x, Tensor scale, Tensor bias, Tensor saved_mean, Tensor saved_variance, Tensor reserve_space, Tensor out_grad, float momentum, float epsilon, str data_layout, bool is_test, bool use_global_stats, bool trainable_statistics
, bool fuse_with_relu
)
forward
:
sync_batch_norm_(Tensor x, Tensor
mean, Tensor variance, Tensor scale, Tensor bias, bool is_test, float momentum, float epsilon, str data_layout, bool use_global_stats, bool trainable_statistics
) -> Tensor(out), Tensor(mean_out), Tensor(variance_out), Tensor(saved_mean), Tensor(saved_variance), Tensor(reserve_space)
args
:
(Tensor x, Tensor scale, Tensor bias, Tensor saved_mean, Tensor saved_variance, Tensor reserve_space, Tensor out_grad, float momentum, float epsilon, str data_layout, bool is_test, bool use_global_stats, bool trainable_statistics)
output
:
Tensor(x_grad), Tensor(scale_grad), Tensor(bias_grad)
infer_meta
:
func
:
GeneralTernaryGradInferMeta
...
...
paddle/phi/api/yaml/sparse_ops.yaml
浏览文件 @
fe8c6796
...
...
@@ -88,7 +88,7 @@
backward
:
atanh_grad
-
op
:
batch_norm
args
:
(Tensor x, Tensor
scale, Tensor bias, Tensor mean, Tensor variance, float momentum, float epsilon, str data_layout, bool is_test, bool use_global_stats, bool trainable_statistics, bool fuse_with_relu
)
args
:
(Tensor x, Tensor
mean, Tensor variance, Tensor scale, Tensor bias, bool is_test, float momentum, float epsilon, str data_layout, bool use_global_stats, bool trainable_statistics
)
output
:
Tensor(out), Tensor(mean_out), Tensor(variance_out), Tensor(saved_mean), Tensor(saved_variance), Tensor(reserve_space)
infer_meta
:
func
:
BatchNormInferMeta
...
...
@@ -324,7 +324,7 @@
backward
:
subtract_grad
-
op
:
sync_batch_norm_
args
:
(Tensor x, Tensor
scale, Tensor bias, Tensor mean, Tensor variance, float momentum, float epsilon, str data_layout, bool is_test, bool use_global_stats, bool trainable_statistics, bool fuse_with_relu
)
args
:
(Tensor x, Tensor
mean, Tensor variance, Tensor scale, Tensor bias, bool is_test, float momentum, float epsilon, str data_layout, bool use_global_stats, bool trainable_statistics
)
output
:
Tensor(out), Tensor(mean_out), Tensor(variance_out), Tensor(saved_mean), Tensor(saved_variance), Tensor(reserve_space)
infer_meta
:
func
:
BatchNormInferMeta
...
...
paddle/phi/infermeta/binary.cc
浏览文件 @
fe8c6796
...
...
@@ -564,9 +564,6 @@ void Conv3DInferMeta(const MetaTensor& input,
int
groups
,
const
std
::
vector
<
int
>&
dilations
,
const
std
::
string
&
data_format
,
bool
use_addto
,
int
workspace_size_MB
,
bool
exhaustive_search
,
MetaTensor
*
out
,
MetaConfig
config
)
{
ConvInferMeta
(
input
,
...
...
@@ -927,9 +924,6 @@ void DepthwiseConvInferMeta(const MetaTensor& input,
int
groups
,
const
std
::
vector
<
int
>&
dilations
,
const
std
::
string
&
data_format
,
bool
use_addto
,
int
workspace_size_MB
,
bool
exhaustive_search
,
MetaTensor
*
out
,
MetaConfig
config
)
{
ConvInferMeta
(
input
,
...
...
paddle/phi/infermeta/binary.h
浏览文件 @
fe8c6796
...
...
@@ -95,9 +95,6 @@ void Conv3DInferMeta(const MetaTensor& input,
int
groups
,
const
std
::
vector
<
int
>&
dilations
,
const
std
::
string
&
data_format
,
bool
use_addto
,
int
workspace_size_MB
,
bool
exhaustive_search
,
MetaTensor
*
out
,
MetaConfig
config
=
MetaConfig
());
...
...
@@ -151,9 +148,6 @@ void DepthwiseConvInferMeta(const MetaTensor& input,
int
groups
,
const
std
::
vector
<
int
>&
dilations
,
const
std
::
string
&
data_format
,
bool
use_addto
,
int
workspace_size_MB
,
bool
exhaustive_search
,
MetaTensor
*
out
,
MetaConfig
config
=
MetaConfig
());
...
...
paddle/phi/infermeta/multiary.cc
浏览文件 @
fe8c6796
...
...
@@ -534,17 +534,16 @@ void AverageAccumulatesInferMeta(const MetaTensor& param,
}
void
BatchNormInferMeta
(
const
MetaTensor
&
x
,
const
MetaTensor
&
scale
,
const
MetaTensor
&
bias
,
const
MetaTensor
&
mean
,
const
MetaTensor
&
variance
,
const
MetaTensor
&
scale
,
const
MetaTensor
&
bias
,
bool
is_test
,
float
momentum
,
float
epsilon
,
const
std
::
string
&
data_layout_str
,
bool
is_test
,
bool
use_global_stats
,
bool
trainable_statistics
,
bool
fuse_with_relu
,
MetaTensor
*
y
,
MetaTensor
*
mean_out
,
MetaTensor
*
variance_out
,
...
...
@@ -646,10 +645,10 @@ void BatchNormInferMeta(const MetaTensor& x,
}
void
BatchNormInferInferMeta
(
const
MetaTensor
&
x
,
const
MetaTensor
&
scale
,
const
MetaTensor
&
bias
,
const
MetaTensor
&
mean
,
const
MetaTensor
&
variance
,
const
MetaTensor
&
scale
,
const
MetaTensor
&
bias
,
float
momentum
,
float
epsilon
,
const
std
::
string
&
data_layout
,
...
...
@@ -658,17 +657,16 @@ void BatchNormInferInferMeta(const MetaTensor& x,
MetaTensor
*
variance_out
,
MetaConfig
config
)
{
BatchNormInferMeta
(
x
,
scale
,
bias
,
mean
,
variance
,
scale
,
bias
,
/*is_test=*/
true
,
momentum
,
epsilon
,
data_layout
,
/*is_test=*/
true
,
/*use_global_stats=*/
false
,
/*trainable_statistics=*/
false
,
/*fuse_with_relu=*/
false
,
y
,
mean_out
,
variance_out
,
...
...
paddle/phi/infermeta/multiary.h
浏览文件 @
fe8c6796
...
...
@@ -158,17 +158,16 @@ void AverageAccumulatesInferMeta(const MetaTensor& param,
MetaTensor
*
out_num_updates
);
void
BatchNormInferMeta
(
const
MetaTensor
&
x
,
const
MetaTensor
&
scale
,
const
MetaTensor
&
bias
,
const
MetaTensor
&
mean
,
const
MetaTensor
&
variance
,
const
MetaTensor
&
scale
,
const
MetaTensor
&
bias
,
bool
is_test
,
float
momentum
,
float
epsilon
,
const
std
::
string
&
data_layout
,
bool
is_test
,
bool
use_global_stats
,
bool
trainable_statistics
,
bool
fuse_with_relu
,
MetaTensor
*
y
,
MetaTensor
*
mean_out
,
MetaTensor
*
variance_out
,
...
...
@@ -178,10 +177,10 @@ void BatchNormInferMeta(const MetaTensor& x,
MetaConfig
config
=
MetaConfig
());
void
BatchNormInferInferMeta
(
const
MetaTensor
&
x
,
const
MetaTensor
&
scale
,
const
MetaTensor
&
bias
,
const
MetaTensor
&
mean
,
const
MetaTensor
&
variance
,
const
MetaTensor
&
scale
,
const
MetaTensor
&
bias
,
float
momentum
,
float
epsilon
,
const
std
::
string
&
data_layout
,
...
...
paddle/phi/kernels/batch_norm_grad_kernel.h
浏览文件 @
fe8c6796
...
...
@@ -37,7 +37,6 @@ void BatchNormGradRawKernel(const Context& dev_ctx,
bool
is_test
,
bool
use_global_stats
,
bool
trainable_statistics
,
bool
fuse_with_relu
,
bool
is_inplace
,
DenseTensor
*
x_grad
,
DenseTensor
*
scale_grad
,
...
...
@@ -60,7 +59,6 @@ void BatchNormGradKernel(const Context& dev_ctx,
bool
is_test
,
bool
use_global_stats
,
bool
trainable_statistics
,
bool
fuse_with_relu
,
DenseTensor
*
x_grad
,
DenseTensor
*
scale_grad
,
DenseTensor
*
bias_grad
);
...
...
@@ -83,7 +81,6 @@ void BatchNormDoubleGradKernel(const Context& dev_ctx,
bool
is_test
,
bool
use_global_stats
,
bool
trainable_statistics
,
bool
fuse_with_relu
,
DenseTensor
*
x_grad
,
DenseTensor
*
scale_grad
,
DenseTensor
*
y_grad_grad
);
...
...
paddle/phi/kernels/batch_norm_kernel.cc
浏览文件 @
fe8c6796
...
...
@@ -22,10 +22,10 @@ namespace phi {
template
<
typename
T
,
typename
Context
>
void
BatchNormInferKernel
(
const
Context
&
dev_ctx
,
const
DenseTensor
&
x
,
const
DenseTensor
&
scale
,
const
DenseTensor
&
bias
,
const
DenseTensor
&
mean
,
const
DenseTensor
&
variance
,
const
DenseTensor
&
scale
,
const
DenseTensor
&
bias
,
float
momentum
,
float
epsilon
,
const
std
::
string
&
data_layout
,
...
...
@@ -39,17 +39,16 @@ void BatchNormInferKernel(const Context& dev_ctx,
auto
saved_variance
=
phi
::
EmptyLike
<
T
,
Context
>
(
dev_ctx
,
*
variance_out
);
BatchNormKernel
<
T
,
Context
>
(
dev_ctx
,
x
,
scale
,
bias
,
mean
,
variance
,
scale
,
bias
,
/*is_test=*/
true
,
momentum
,
epsilon
,
data_layout
,
/*is_test=*/
true
,
/*use_global_stats=*/
false
,
/*trainable_statistics=*/
false
,
/*fuse_with_relu=*/
false
,
y
,
mean_out
,
variance_out
,
...
...
paddle/phi/kernels/batch_norm_kernel.h
浏览文件 @
fe8c6796
...
...
@@ -23,17 +23,16 @@ namespace phi {
template
<
typename
T
,
typename
Context
>
void
BatchNormKernel
(
const
Context
&
dev_ctx
,
const
DenseTensor
&
x
,
const
DenseTensor
&
scale
,
const
DenseTensor
&
bias
,
const
DenseTensor
&
mean
,
const
DenseTensor
&
variance
,
const
DenseTensor
&
scale
,
const
DenseTensor
&
bias
,
bool
is_test
,
float
momentum
,
float
epsilon
,
const
std
::
string
&
data_layout
,
bool
is_test
,
bool
use_global_stats
,
bool
trainable_statistics
,
bool
fuse_with_relu
,
DenseTensor
*
y
,
DenseTensor
*
mean_out
,
DenseTensor
*
variance_out
,
...
...
@@ -44,10 +43,10 @@ void BatchNormKernel(const Context& dev_ctx,
template
<
typename
T
,
typename
Context
>
void
BatchNormInferKernel
(
const
Context
&
dev_ctx
,
const
DenseTensor
&
x
,
const
DenseTensor
&
scale
,
const
DenseTensor
&
bias
,
const
DenseTensor
&
mean
,
const
DenseTensor
&
variance
,
const
DenseTensor
&
scale
,
const
DenseTensor
&
bias
,
float
momentum
,
float
epsilon
,
const
std
::
string
&
data_layout
,
...
...
paddle/phi/kernels/conv_grad_kernel.h
浏览文件 @
fe8c6796
...
...
@@ -43,9 +43,6 @@ void Conv3DGradKernel(const Context& dev_ctx,
int
groups
,
const
std
::
vector
<
int
>&
dilations
,
const
std
::
string
&
data_format
,
bool
use_addto
,
int
workspace_size_MB
,
bool
exhaustive_search
,
DenseTensor
*
input_grad
,
DenseTensor
*
filter_grad
);
...
...
@@ -60,10 +57,6 @@ void DepthwiseConvGradKernel(const Context& dev_ctx,
int
groups
,
const
std
::
vector
<
int
>&
dilations
,
const
std
::
string
&
data_format
,
bool
use_addto
,
int
workspace_size_MB
,
bool
exhaustive_search
,
bool
fuse_relu
,
DenseTensor
*
input_grad
,
DenseTensor
*
filter_grad
);
...
...
@@ -85,23 +78,21 @@ void ConvGradGradKernel(const Context& dev_ctx,
DenseTensor
*
out_grad_grad
);
template
<
typename
T
,
typename
Context
>
void
Conv3DGradGradKernel
(
const
Context
&
dev_ctx
,
const
DenseTensor
&
input
,
const
DenseTensor
&
filter
,
const
DenseTensor
&
out_grad
,
const
paddle
::
optional
<
DenseTensor
>&
input_grad_grad
,
const
paddle
::
optional
<
DenseTensor
>&
filter_grad_grad
,
const
std
::
vector
<
int
>&
strides
,
const
std
::
vector
<
int
>&
paddings
,
const
std
::
string
&
padding_algorithm
,
int
groups
,
const
std
::
vector
<
int
>&
dilations
,
const
std
::
string
&
data_format
,
bool
use_addto
,
int
workspace_size_MB
,
bool
exhaustive_search
,
DenseTensor
*
input_grad
,
DenseTensor
*
filter_grad
,
DenseTensor
*
out_grad_grad
);
void
Conv3DDoubleGradKernel
(
const
Context
&
dev_ctx
,
const
DenseTensor
&
input
,
const
DenseTensor
&
filter
,
const
DenseTensor
&
out_grad
,
const
paddle
::
optional
<
DenseTensor
>&
input_grad_grad
,
const
paddle
::
optional
<
DenseTensor
>&
filter_grad_grad
,
const
std
::
vector
<
int
>&
strides
,
const
std
::
vector
<
int
>&
paddings
,
const
std
::
string
&
padding_algorithm
,
int
groups
,
const
std
::
vector
<
int
>&
dilations
,
const
std
::
string
&
data_format
,
DenseTensor
*
input_grad
,
DenseTensor
*
filter_grad
,
DenseTensor
*
out_grad_grad
);
}
// namespace phi
paddle/phi/kernels/conv_kernel.h
浏览文件 @
fe8c6796
...
...
@@ -40,9 +40,6 @@ void Conv3DKernel(const Context& dev_ctx,
int
groups
,
const
std
::
vector
<
int
>&
dilations
,
const
std
::
string
&
data_format
,
bool
use_addto
,
int
workspace_size_MB
,
bool
exhaustive_search
,
DenseTensor
*
out
);
template
<
typename
T
,
typename
Context
>
...
...
@@ -55,10 +52,6 @@ void DepthwiseConvKernel(const Context& dev_ctx,
int
groups
,
const
std
::
vector
<
int
>&
dilations
,
const
std
::
string
&
data_format
,
bool
use_addto
,
int
workspace_size_MB
,
bool
exhaustive_search
,
bool
fuse_relu
,
DenseTensor
*
out
);
}
// namespace phi
paddle/phi/kernels/cpu/batch_norm_grad_kernel.cc
浏览文件 @
fe8c6796
...
...
@@ -52,7 +52,6 @@ void BatchNormGradRawKernel(const Context& ctx,
bool
is_test
,
bool
use_global_stats
,
bool
trainable_statistics
,
bool
fuse_with_relu
,
bool
is_inplace
,
DenseTensor
*
x_grad
,
DenseTensor
*
scale_grad
,
...
...
@@ -310,7 +309,6 @@ void BatchNormGradKernel(const Context& dev_ctx,
bool
is_test
,
bool
use_global_stats
,
bool
trainable_statistics
,
bool
fuse_with_relu
,
DenseTensor
*
x_grad
,
DenseTensor
*
scale_grad
,
DenseTensor
*
bias_grad
)
{
...
...
@@ -330,7 +328,6 @@ void BatchNormGradKernel(const Context& dev_ctx,
is_test
,
use_global_stats
,
trainable_statistics
,
fuse_with_relu
,
false
,
x_grad
,
scale_grad
,
...
...
@@ -355,7 +352,6 @@ void BatchNormDoubleGradKernel(const Context& ctx,
bool
is_test
,
bool
use_global_stats
,
bool
trainable_statistics
,
bool
fuse_with_relu
,
DenseTensor
*
x_grad
,
DenseTensor
*
scale_grad
,
DenseTensor
*
y_grad_grad
)
{
...
...
paddle/phi/kernels/cpu/batch_norm_kernel.cc
浏览文件 @
fe8c6796
...
...
@@ -36,17 +36,16 @@ using ConstEigenVectorArrayMap =
template
<
typename
T
,
typename
Context
>
void
BatchNormKernel
(
const
Context
&
ctx
,
const
DenseTensor
&
x
,
const
DenseTensor
&
scale
,
const
DenseTensor
&
bias
,
const
DenseTensor
&
mean
,
const
DenseTensor
&
variance
,
const
DenseTensor
&
scale
,
const
DenseTensor
&
bias
,
bool
is_test
,
float
momentum
,
float
epsilon
,
const
std
::
string
&
data_layout_str
,
bool
is_test
,
bool
use_global_stats
,
bool
trainable_statistics
,
bool
fuse_with_relu
,
DenseTensor
*
y
,
DenseTensor
*
mean_out
,
DenseTensor
*
variance_out
,
...
...
paddle/phi/kernels/cpu/conv_grad_kernel.cc
浏览文件 @
fe8c6796
...
...
@@ -31,10 +31,6 @@ void DepthwiseConvGradKernel(const Context& dev_ctx,
int
groups
,
const
std
::
vector
<
int
>&
dilations
,
const
std
::
string
&
data_format
,
bool
use_addto
,
int
workspace_size_MB
,
bool
exhaustive_search
,
bool
fuse_relu
,
DenseTensor
*
input_grad
,
DenseTensor
*
filter_grad
)
{
ConvGradKernel
<
T
>
(
dev_ctx
,
...
...
@@ -62,9 +58,6 @@ void Conv3DGradKernel(const Context& dev_ctx,
int
groups
,
const
std
::
vector
<
int
>&
dilations
,
const
std
::
string
&
data_format
,
bool
use_addto
,
int
workspace_size_MB
,
bool
exhaustive_search
,
DenseTensor
*
input_grad
,
DenseTensor
*
filter_grad
)
{
ConvGradKernel
<
T
>
(
dev_ctx
,
...
...
@@ -82,24 +75,22 @@ void Conv3DGradKernel(const Context& dev_ctx,
}
template
<
typename
T
,
typename
Context
>
void
Conv3DGradGradKernel
(
const
Context
&
ctx
,
const
DenseTensor
&
input
,
const
DenseTensor
&
filter
,
const
DenseTensor
&
out_grad
,
const
paddle
::
optional
<
DenseTensor
>&
input_grad_grad
,
const
paddle
::
optional
<
DenseTensor
>&
filter_grad_grad
,
const
std
::
vector
<
int
>&
strides
,
const
std
::
vector
<
int
>&
paddings_t
,
const
std
::
string
&
padding_algorithm
,
int
groups
,
const
std
::
vector
<
int
>&
dilations_t
,
const
std
::
string
&
data_format
,
bool
use_addto
,
int
workspace_size_MB
,
bool
exhaustive_search_t
,
DenseTensor
*
input_grad
,
DenseTensor
*
filter_grad
,
DenseTensor
*
out_grad_grad
)
{
void
Conv3DDoubleGradKernel
(
const
Context
&
ctx
,
const
DenseTensor
&
input
,
const
DenseTensor
&
filter
,
const
DenseTensor
&
out_grad
,
const
paddle
::
optional
<
DenseTensor
>&
input_grad_grad
,
const
paddle
::
optional
<
DenseTensor
>&
filter_grad_grad
,
const
std
::
vector
<
int
>&
strides
,
const
std
::
vector
<
int
>&
paddings_t
,
const
std
::
string
&
padding_algorithm
,
int
groups
,
const
std
::
vector
<
int
>&
dilations_t
,
const
std
::
string
&
data_format
,
DenseTensor
*
input_grad
,
DenseTensor
*
filter_grad
,
DenseTensor
*
out_grad_grad
)
{
ConvGradGradKernel
<
T
>
(
ctx
,
input
,
filter
,
...
...
@@ -136,9 +127,9 @@ PD_REGISTER_KERNEL(
conv2d_grad_grad
,
CPU
,
ALL_LAYOUT
,
phi
::
ConvGradGradKernel
,
float
,
double
)
{
}
PD_REGISTER_KERNEL
(
conv3d_
grad
_grad
,
PD_REGISTER_KERNEL
(
conv3d_
double
_grad
,
CPU
,
ALL_LAYOUT
,
phi
::
Conv3D
Grad
GradKernel
,
phi
::
Conv3D
Double
GradKernel
,
float
,
double
)
{}
paddle/phi/kernels/cpu/conv_kernel.cc
浏览文件 @
fe8c6796
...
...
@@ -53,10 +53,6 @@ void DepthwiseConvKernel(const Context& dev_ctx,
int
groups
,
const
std
::
vector
<
int
>&
dilations
,
const
std
::
string
&
data_format
,
bool
use_addto
,
int
workspace_size_MB
,
bool
exhaustive_search
,
bool
fuse_relu
,
DenseTensor
*
out
)
{
ConvKernelImpl
<
T
>
(
dev_ctx
,
input
,
...
...
@@ -80,9 +76,6 @@ void Conv3DKernel(const Context& dev_ctx,
int
groups
,
const
std
::
vector
<
int
>&
dilations
,
const
std
::
string
&
data_format
,
bool
use_addto
,
int
workspace_size_MB
,
bool
exhaustive_search
,
DenseTensor
*
out
)
{
ConvKernelImpl
<
T
>
(
dev_ctx
,
input
,
...
...
paddle/phi/kernels/gpu/batch_norm_grad_kernel.cu
浏览文件 @
fe8c6796
...
...
@@ -578,7 +578,6 @@ void BatchNormGradRawKernel(const Context &ctx,
bool
is_test
,
bool
use_global_stats
,
bool
trainable_statistics
,
bool
fuse_with_relu
,
bool
is_inplace
,
DenseTensor
*
x_grad
,
DenseTensor
*
scale_grad
,
...
...
@@ -1262,7 +1261,6 @@ void BatchNormGradKernel(const Context &dev_ctx,
bool
is_test
,
bool
use_global_stats
,
bool
trainable_statistics
,
bool
fuse_with_relu
,
DenseTensor
*
x_grad
,
DenseTensor
*
scale_grad
,
DenseTensor
*
bias_grad
)
{
...
...
@@ -1282,7 +1280,6 @@ void BatchNormGradKernel(const Context &dev_ctx,
is_test
,
use_global_stats
,
trainable_statistics
,
fuse_with_relu
,
false
,
x_grad
,
scale_grad
,
...
...
@@ -1307,7 +1304,6 @@ void BatchNormDoubleGradKernel(const Context &ctx,
bool
is_test
,
bool
use_global_stats
,
bool
trainable_statistics
,
bool
fuse_with_relu
,
DenseTensor
*
x_grad
,
DenseTensor
*
scale_grad
,
DenseTensor
*
y_grad_grad
)
{
...
...
paddle/phi/kernels/gpu/batch_norm_kernel.cu
浏览文件 @
fe8c6796
...
...
@@ -533,17 +533,16 @@ static __global__ void BNForwardTraining2DWriteRes(
template
<
typename
T
,
typename
Context
>
void
BatchNormKernel
(
const
Context
&
ctx
,
const
DenseTensor
&
x
,
const
DenseTensor
&
scale
,
const
DenseTensor
&
bias
,
const
DenseTensor
&
mean
,
const
DenseTensor
&
variance
,
const
DenseTensor
&
scale
,
const
DenseTensor
&
bias
,
bool
is_test
,
float
momentum
,
float
epsilon_f
,
const
std
::
string
&
data_layout_str
,
bool
is_test
,
bool
use_global_stats
,
bool
trainable_statistics
,
bool
fuse_with_relu
,
DenseTensor
*
y
,
DenseTensor
*
mean_out
,
DenseTensor
*
variance_out
,
...
...
paddle/phi/kernels/gpu/conv_grad_kernel.cu
浏览文件 @
fe8c6796
...
...
@@ -31,9 +31,6 @@ void Conv3DGradKernel(const Context& dev_ctx,
int
groups
,
const
std
::
vector
<
int
>&
dilations
,
const
std
::
string
&
data_format
,
bool
use_addto
,
int
workspace_size_MB
,
bool
exhaustive_search
,
DenseTensor
*
input_grad
,
DenseTensor
*
filter_grad
)
{
ConvGradKernel
<
T
>
(
dev_ctx
,
...
...
paddle/phi/kernels/gpu/conv_kernel.cu
浏览文件 @
fe8c6796
...
...
@@ -53,9 +53,6 @@ void Conv3DKernel(const Context& dev_ctx,
int
groups
,
const
std
::
vector
<
int
>&
dilations
,
const
std
::
string
&
data_format
,
bool
use_addto
,
int
workspace_size_MB
,
bool
exhaustive_search
,
DenseTensor
*
out
)
{
ConvKernelImpl
<
T
>
(
dev_ctx
,
input
,
...
...
paddle/phi/kernels/gpu/depthwise_conv_grad_kernel.cu
浏览文件 @
fe8c6796
...
...
@@ -33,16 +33,19 @@ void DepthwiseConvGradKernel(const Context& dev_ctx,
int
groups
,
const
std
::
vector
<
int
>&
dilations_t
,
const
std
::
string
&
data_format
,
bool
use_addto
,
int
workspace_size_MB
,
bool
exhaustive_search
,
bool
fuse_relu
,
DenseTensor
*
input_grad
,
DenseTensor
*
filter_grad
)
{
const
DenseTensor
*
output_grad
=
&
out_grad
;
if
(
!
input_grad
&&
!
filter_grad
)
return
;
bool
has_fuse_relu
=
dev_ctx
.
HasDnnAttr
(
"fuse_relu_before_depthwise_conv"
);
bool
fuse_relu
=
has_fuse_relu
?
PADDLE_GET_CONST
(
bool
,
dev_ctx
.
GetDnnAttr
(
"fuse_relu_before_depthwise_conv"
))
:
false
;
std
::
vector
<
int
>
strides
=
strides_t
;
std
::
vector
<
int
>
paddings
=
paddings_t
;
std
::
vector
<
int
>
dilations
=
dilations_t
;
...
...
paddle/phi/kernels/gpu/depthwise_conv_kernel.cu
浏览文件 @
fe8c6796
...
...
@@ -31,10 +31,6 @@ void DepthwiseConvKernel(const Context& dev_ctx,
int
groups
,
const
std
::
vector
<
int
>&
dilations_t
,
const
std
::
string
&
data_format
,
bool
use_addto
,
int
workspace_size_MB
,
bool
exhaustive_search
,
bool
fuse_relu
,
DenseTensor
*
out
)
{
DenseTensor
*
output
=
out
;
output
->
mutable_data
<
T
>
(
dev_ctx
.
GetPlace
());
...
...
@@ -44,6 +40,14 @@ void DepthwiseConvKernel(const Context& dev_ctx,
std
::
vector
<
int
>
paddings
=
paddings_t
;
const
bool
channel_last
=
(
data_format
==
"NHWC"
||
data_format
==
"NDHWC"
);
bool
has_fuse_relu
=
dev_ctx
.
HasDnnAttr
(
"fuse_relu_before_depthwise_conv"
);
bool
fuse_relu
=
has_fuse_relu
?
PADDLE_GET_CONST
(
bool
,
dev_ctx
.
GetDnnAttr
(
"fuse_relu_before_depthwise_conv"
))
:
false
;
if
(
channel_last
)
{
PADDLE_ENFORCE_EQ
(
output
->
dims
()[
output
->
dims
().
size
()
-
1
]
%
...
...
paddle/phi/kernels/gpu/sync_batch_norm_grad_kernel.cu
浏览文件 @
fe8c6796
...
...
@@ -34,7 +34,6 @@ void SyncBatchNormGradKernel(const Context& ctx,
bool
is_test
,
bool
use_global_stats
,
bool
trainable_statistics
,
bool
fuse_with_relu
,
DenseTensor
*
x_grad
,
DenseTensor
*
scale_grad
,
DenseTensor
*
bias_grad
)
{
...
...
paddle/phi/kernels/gpu/sync_batch_norm_kernel.cu
浏览文件 @
fe8c6796
...
...
@@ -22,17 +22,16 @@ namespace phi {
template
<
typename
T
,
typename
Context
>
void
SyncBatchNormKernel
(
const
Context
&
ctx
,
const
DenseTensor
&
x
,
const
DenseTensor
&
scale
,
const
DenseTensor
&
bias
,
const
DenseTensor
&
mean
,
const
DenseTensor
&
variance
,
const
DenseTensor
&
scale
,
const
DenseTensor
&
bias
,
bool
is_test
,
float
momentum
,
float
epsilon_f
,
const
std
::
string
&
data_layout_str
,
bool
is_test
,
bool
use_global_stats
,
bool
trainable_statistics
,
bool
fuse_with_relu
,
DenseTensor
*
y
,
DenseTensor
*
mean_out
,
DenseTensor
*
variance_out
,
...
...
paddle/phi/kernels/gpudnn/conv_grad_kernel.cu
浏览文件 @
fe8c6796
...
...
@@ -603,9 +603,6 @@ void Conv3DCudnnGradKernel(const Context& dev_ctx,
int
groups
,
const
std
::
vector
<
int
>&
dilations
,
const
std
::
string
&
data_format
,
bool
use_addto
,
int
workspace_size_MB
,
bool
exhaustive_search
,
DenseTensor
*
input_grad
,
DenseTensor
*
filter_grad
)
{
ConvCudnnGradKernel
<
T
>
(
dev_ctx
,
...
...
@@ -1295,10 +1292,6 @@ void DepthwiseConvDoubleGradGPUDNNKernel(
int
groups
,
const
std
::
vector
<
int
>&
dilations_t
,
const
std
::
string
&
data_format
,
bool
use_addto
,
int
workspace_size_MB
,
bool
exhaustive_search_t
,
bool
fuse_relu
,
DenseTensor
*
input_grad
,
DenseTensor
*
filter_grad
,
DenseTensor
*
out_grad_grad
)
{
...
...
@@ -1320,7 +1313,7 @@ void DepthwiseConvDoubleGradGPUDNNKernel(
}
template
<
typename
T
,
typename
Context
>
void
Conv3DCudnn
Grad
GradKernel
(
void
Conv3DCudnn
Double
GradKernel
(
const
Context
&
ctx
,
const
DenseTensor
&
input
,
const
DenseTensor
&
filter
,
...
...
@@ -1333,9 +1326,6 @@ void Conv3DCudnnGradGradKernel(
int
groups
,
const
std
::
vector
<
int
>&
dilations_t
,
const
std
::
string
&
data_format
,
bool
use_addto
,
int
workspace_size_MB
,
bool
exhaustive_search_t
,
DenseTensor
*
input_grad
,
DenseTensor
*
filter_grad
,
DenseTensor
*
out_grad_grad
)
{
...
...
@@ -1386,14 +1376,14 @@ PD_REGISTER_KERNEL(conv2d_grad_grad,
float
,
phi
::
dtype
::
float16
)
{}
PD_REGISTER_KERNEL
(
conv3d_
grad
_grad
,
PD_REGISTER_KERNEL
(
conv3d_
double
_grad
,
GPUDNN
,
ALL_LAYOUT
,
phi
::
Conv3DCudnn
Grad
GradKernel
,
phi
::
Conv3DCudnn
Double
GradKernel
,
float
,
phi
::
dtype
::
float16
)
{}
PD_REGISTER_KERNEL
(
depthwise_conv2d_
grad
_grad
,
PD_REGISTER_KERNEL
(
depthwise_conv2d_
double
_grad
,
GPU
,
ALL_LAYOUT
,
phi
::
DepthwiseConvDoubleGradGPUDNNKernel
,
...
...
@@ -1427,16 +1417,16 @@ PD_REGISTER_KERNEL(conv2d_grad_grad,
phi
::
dtype
::
float16
,
phi
::
dtype
::
bfloat16
)
{}
PD_REGISTER_KERNEL
(
conv3d_
grad
_grad
,
PD_REGISTER_KERNEL
(
conv3d_
double
_grad
,
GPUDNN
,
ALL_LAYOUT
,
phi
::
Conv3DCudnn
Grad
GradKernel
,
phi
::
Conv3DCudnn
Double
GradKernel
,
float
,
double
,
phi
::
dtype
::
float16
,
phi
::
dtype
::
bfloat16
)
{}
PD_REGISTER_KERNEL
(
depthwise_conv2d_
grad
_grad
,
PD_REGISTER_KERNEL
(
depthwise_conv2d_
double
_grad
,
GPU
,
ALL_LAYOUT
,
phi
::
DepthwiseConvDoubleGradGPUDNNKernel
,
...
...
@@ -1469,15 +1459,15 @@ PD_REGISTER_KERNEL(conv2d_grad_grad,
double
,
phi
::
dtype
::
float16
)
{}
PD_REGISTER_KERNEL
(
conv3d_
grad
_grad
,
PD_REGISTER_KERNEL
(
conv3d_
double
_grad
,
GPUDNN
,
ALL_LAYOUT
,
phi
::
Conv3DCudnn
Grad
GradKernel
,
phi
::
Conv3DCudnn
Double
GradKernel
,
float
,
double
,
phi
::
dtype
::
float16
)
{}
PD_REGISTER_KERNEL
(
depthwise_conv2d_
grad
_grad
,
PD_REGISTER_KERNEL
(
depthwise_conv2d_
double
_grad
,
GPU
,
ALL_LAYOUT
,
phi
::
DepthwiseConvDoubleGradGPUDNNKernel
,
...
...
paddle/phi/kernels/gpudnn/conv_kernel.cu
浏览文件 @
fe8c6796
...
...
@@ -397,9 +397,6 @@ void Conv3DCudnnKernel(const Context& dev_ctx,
int
groups
,
const
std
::
vector
<
int
>&
dilations
,
const
std
::
string
&
data_format
,
bool
use_addto
,
int
workspace_size_MB
,
bool
exhaustive_search
,
DenseTensor
*
out
)
{
ConvCudnnKernel
<
T
>
(
dev_ctx
,
input
,
...
...
@@ -423,10 +420,6 @@ void DepthwiseConvCudnnKernel(const Context& dev_ctx,
int
groups
,
const
std
::
vector
<
int
>&
dilations
,
const
std
::
string
&
data_format
,
bool
use_addto
,
int
workspace_size_MB
,
bool
exhaustive_search
,
bool
fuse_relu
,
DenseTensor
*
out
)
{
ConvCudnnKernel
<
T
>
(
dev_ctx
,
input
,
...
...
paddle/phi/kernels/sparse/batch_norm_grad_kernel.cc
浏览文件 @
fe8c6796
...
...
@@ -38,7 +38,6 @@ void BatchNormCooGradKernel(const Context& dev_ctx,
bool
is_test
,
bool
use_global_stats
,
bool
trainable_statistics
,
bool
fuse_with_relu
,
SparseCooTensor
*
x_grad
,
DenseTensor
*
scale_grad
,
DenseTensor
*
bias_grad
)
{
...
...
@@ -61,7 +60,6 @@ void BatchNormCooGradKernel(const Context& dev_ctx,
is_test
,
use_global_stats
,
trainable_statistics
,
fuse_with_relu
,
x_grad
->
mutable_values
(),
scale_grad
,
bias_grad
);
...
...
paddle/phi/kernels/sparse/batch_norm_grad_kernel.h
浏览文件 @
fe8c6796
...
...
@@ -39,7 +39,6 @@ void BatchNormCooGradKernel(const Context& dev_ctx,
bool
is_test
,
bool
use_global_stats
,
bool
trainable_statistics
,
bool
fuse_with_relu
,
SparseCooTensor
*
x_grad
,
DenseTensor
*
scale_grad
,
DenseTensor
*
bias_grad
);
...
...
paddle/phi/kernels/sparse/batch_norm_kernel.cc
浏览文件 @
fe8c6796
...
...
@@ -23,17 +23,16 @@ namespace sparse {
template
<
typename
T
,
typename
Context
>
void
BatchNormCooKernel
(
const
Context
&
dev_ctx
,
const
SparseCooTensor
&
x
,
const
DenseTensor
&
scale
,
const
DenseTensor
&
bias
,
const
DenseTensor
&
mean
,
const
DenseTensor
&
variance
,
const
DenseTensor
&
scale
,
const
DenseTensor
&
bias
,
bool
is_test
,
float
momentum
,
float
epsilon
,
const
std
::
string
&
data_layout
,
bool
is_test
,
bool
use_global_stats
,
bool
trainable_statistics
,
bool
fuse_with_relu
,
SparseCooTensor
*
y
,
DenseTensor
*
mean_out
,
DenseTensor
*
variance_out
,
...
...
@@ -43,17 +42,16 @@ void BatchNormCooKernel(const Context& dev_ctx,
EmptyLikeCooKernel
<
T
,
Context
>
(
dev_ctx
,
x
,
y
);
phi
::
BatchNormKernel
<
T
,
Context
>
(
dev_ctx
,
x
.
values
(),
scale
,
bias
,
mean
,
variance
,
scale
,
bias
,
is_test
,
momentum
,
epsilon
,
data_layout
,
is_test
,
use_global_stats
,
trainable_statistics
,
fuse_with_relu
,
y
->
mutable_values
(),
mean_out
,
variance_out
,
...
...
paddle/phi/kernels/sparse/batch_norm_kernel.h
浏览文件 @
fe8c6796
...
...
@@ -35,7 +35,6 @@ void BatchNormKernel(const Context& dev_ctx,
bool
is_test
,
bool
use_global_stats
,
bool
trainable_statistics
,
bool
fuse_with_relu
,
SparseCooTensor
*
y
,
DenseTensor
*
mean_out
,
DenseTensor
*
variance_out
,
...
...
paddle/phi/kernels/sparse/gpu/sync_batch_norm_grad_kernel.cu
浏览文件 @
fe8c6796
...
...
@@ -37,7 +37,6 @@ void SyncBatchNormCooGradKernel(
bool
is_test
,
bool
use_global_stats
,
bool
trainable_statistics
,
bool
fuse_with_relu
,
SparseCooTensor
*
x_grad
,
DenseTensor
*
scale_grad
,
DenseTensor
*
bias_grad
)
{
...
...
@@ -58,7 +57,6 @@ void SyncBatchNormCooGradKernel(
is_test
,
use_global_stats
,
trainable_statistics
,
fuse_with_relu
,
x_grad
->
mutable_values
(),
scale_grad
,
bias_grad
);
...
...
paddle/phi/kernels/sparse/gpu/sync_batch_norm_kernel.cu
浏览文件 @
fe8c6796
...
...
@@ -23,17 +23,16 @@ namespace sparse {
template
<
typename
T
,
typename
Context
>
void
SyncBatchNormCooKernel
(
const
Context
&
dev_ctx
,
const
SparseCooTensor
&
x
,
const
DenseTensor
&
scale
,
const
DenseTensor
&
bias
,
const
DenseTensor
&
mean
,
const
DenseTensor
&
variance
,
const
DenseTensor
&
scale
,
const
DenseTensor
&
bias
,
bool
is_test
,
float
momentum
,
float
epsilon
,
const
std
::
string
&
data_layout
,
bool
is_test
,
bool
use_global_stats
,
bool
trainable_statistics
,
bool
fuse_with_relu
,
SparseCooTensor
*
y
,
DenseTensor
*
mean_out
,
DenseTensor
*
variance_out
,
...
...
@@ -43,17 +42,16 @@ void SyncBatchNormCooKernel(const Context& dev_ctx,
EmptyLikeCooKernel
<
T
,
Context
>
(
dev_ctx
,
x
,
y
);
phi
::
SyncBatchNormKernel
<
T
,
Context
>
(
dev_ctx
,
x
.
values
(),
scale
,
bias
,
mean
,
variance
,
scale
,
bias
,
is_test
,
momentum
,
epsilon
,
data_layout
,
is_test
,
use_global_stats
,
trainable_statistics
,
fuse_with_relu
,
y
->
mutable_values
(),
mean_out
,
variance_out
,
...
...
paddle/phi/kernels/sparse/sync_batch_norm_grad_kernel.h
浏览文件 @
fe8c6796
...
...
@@ -38,7 +38,6 @@ void SyncBatchNormCooGradKernel(
bool
is_test
,
bool
use_global_stats
,
bool
trainable_statistics
,
bool
fuse_with_relu
,
SparseCooTensor
*
x_grad
,
DenseTensor
*
scale_grad
,
DenseTensor
*
bias_grad
);
...
...
paddle/phi/kernels/sparse/sync_batch_norm_kernel.h
浏览文件 @
fe8c6796
...
...
@@ -25,17 +25,16 @@ namespace sparse {
template
<
typename
T
,
typename
Context
>
void
SyncBatchNormCooKernel
(
const
Context
&
dev_ctx
,
const
SparseCooTensor
&
x
,
const
DenseTensor
&
scale
,
const
DenseTensor
&
bias
,
const
DenseTensor
&
mean
,
const
DenseTensor
&
variance
,
const
DenseTensor
&
scale
,
const
DenseTensor
&
bias
,
bool
is_test
,
float
momentum
,
float
epsilon
,
const
std
::
string
&
data_layout
,
bool
is_test
,
bool
use_global_stats
,
bool
trainable_statistics
,
bool
fuse_with_relu
,
SparseCooTensor
*
y
,
DenseTensor
*
mean_out
,
DenseTensor
*
variance_out
,
...
...
paddle/phi/kernels/sync_batch_norm_grad_kernel.h
浏览文件 @
fe8c6796
...
...
@@ -35,7 +35,6 @@ void SyncBatchNormGradKernel(const Context& dev_ctx,
bool
is_test
,
bool
use_global_stats
,
bool
trainable_statistics
,
bool
fuse_with_relu
,
DenseTensor
*
x_grad
,
DenseTensor
*
scale_grad
,
DenseTensor
*
bias_grad
);
...
...
paddle/phi/kernels/sync_batch_norm_kernel.h
浏览文件 @
fe8c6796
...
...
@@ -37,17 +37,16 @@ ccl::CCLComm GetCCLComm(const Place& place, int global_gid = 0);
template
<
typename
T
,
typename
Context
>
void
SyncBatchNormKernel
(
const
Context
&
dev_ctx
,
const
DenseTensor
&
x
,
const
DenseTensor
&
scale
,
const
DenseTensor
&
bias
,
const
DenseTensor
&
mean
,
const
DenseTensor
&
variance
,
const
DenseTensor
&
scale
,
const
DenseTensor
&
bias
,
bool
is_test
,
float
momentum
,
float
epsilon
,
const
std
::
string
&
data_layout
,
bool
is_test
,
bool
use_global_stats
,
bool
trainable_statistics
,
bool
fuse_with_relu
,
DenseTensor
*
y
,
DenseTensor
*
mean_out
,
DenseTensor
*
variance_out
,
...
...
paddle/phi/kernels/xpu/batch_norm_grad_kernel.cc
浏览文件 @
fe8c6796
...
...
@@ -86,7 +86,6 @@ void BatchNormGradKernel(const Context &dev_ctx,
bool
is_test
,
bool
use_global_stats
,
bool
trainable_statistics
,
bool
fuse_with_relu
,
DenseTensor
*
x_grad
,
DenseTensor
*
scale_grad
,
DenseTensor
*
bias_grad
)
{
...
...
paddle/phi/kernels/xpu/batch_norm_kernel.cc
浏览文件 @
fe8c6796
...
...
@@ -23,17 +23,16 @@ namespace phi {
template
<
typename
T
,
typename
Context
>
void
BatchNormKernel
(
const
Context
&
dev_ctx
,
const
DenseTensor
&
x
,
const
DenseTensor
&
scale
,
const
DenseTensor
&
bias
,
const
DenseTensor
&
mean
,
const
DenseTensor
&
variance
,
const
DenseTensor
&
scale
,
const
DenseTensor
&
bias
,
bool
is_test
,
float
momentum
,
float
epsilon
,
const
std
::
string
&
data_layout_str
,
bool
is_test
,
const
std
::
string
&
data_layout
,
bool
use_global_stats
,
bool
trainable_statistics
,
bool
fuse_with_relu
,
DenseTensor
*
y
,
DenseTensor
*
mean_out
,
DenseTensor
*
variance_out
,
...
...
paddle/phi/kernels/xpu/conv_grad_kernel.cc
浏览文件 @
fe8c6796
...
...
@@ -152,10 +152,6 @@ void DepthwiseConvGradKernel(const Context& dev_ctx,
int
groups
,
const
std
::
vector
<
int
>&
dilations
,
const
std
::
string
&
data_format
,
bool
use_addto
,
int
workspace_size_MB
,
bool
exhaustive_search
,
bool
fuse_relu
,
DenseTensor
*
input_grad
,
DenseTensor
*
filter_grad
)
{
ConvGradKernel
<
T
,
Context
>
(
dev_ctx
,
...
...
paddle/phi/kernels/xpu/conv_kernel.cc
浏览文件 @
fe8c6796
...
...
@@ -118,10 +118,6 @@ void DepthwiseConvKernel(const Context& dev_ctx,
int
groups
,
const
std
::
vector
<
int
>&
dilations
,
const
std
::
string
&
data_format
,
bool
use_addto
,
int
workspace_size_MB
,
bool
exhaustive_search
,
bool
fuse_relu
,
DenseTensor
*
out
)
{
ConvKernel
<
T
,
Context
>
(
dev_ctx
,
input
,
...
...
paddle/phi/ops/compat/batch_norm_sig.cc
浏览文件 @
fe8c6796
...
...
@@ -33,19 +33,18 @@ KernelSignature BatchNormOpArgumentMapping(const ArgumentMappingContext& ctx) {
if
(
is_test
&&
!
use_global_stats
&&
!
trainable_statistics
&&
!
fuse_with_relu
)
{
return
KernelSignature
(
"batch_norm_infer"
,
{
"X"
,
"
Scale"
,
"Bias"
,
"Mean"
,
"Variance
"
},
{
"X"
,
"
Mean"
,
"Variance"
,
"Scale"
,
"Bias
"
},
{
"momentum"
,
"epsilon"
,
"data_layout"
},
{
"Y"
,
"MeanOut"
,
"VarianceOut"
});
}
else
{
return
KernelSignature
(
"batch_norm"
,
{
"X"
,
"Scale"
,
"Bias"
,
"Mean"
,
"Variance"
},
{
"momentum"
,
{
"X"
,
"Mean"
,
"Variance"
,
"Scale"
,
"Bias"
},
{
"is_test"
,
"momentum"
,
"epsilon"
,
"data_layout"
,
"is_test"
,
"use_global_stats"
,
"trainable_statistics"
,
"fuse_with_relu"
},
"trainable_statistics"
},
{
"Y"
,
"MeanOut"
,
"VarianceOut"
,
...
...
@@ -74,8 +73,7 @@ KernelSignature BatchNormGradOpArgumentMapping(
"data_layout"
,
"is_test"
,
"use_global_stats"
,
"trainable_statistics"
,
"fuse_with_relu"
},
"trainable_statistics"
},
{
"X@GRAD"
,
"Scale@GRAD"
,
"Bias@GRAD"
});
}
...
...
@@ -97,8 +95,7 @@ KernelSignature BatchNormGradGradOpArgumentMapping(
"data_layout"
,
"is_test"
,
"use_global_stats"
,
"trainable_statistics"
,
"fuse_with_relu"
},
"trainable_statistics"
},
{
"DX"
,
"DScale"
,
"DDY"
});
}
...
...
paddle/phi/ops/compat/conv3d_sig.cc
浏览文件 @
fe8c6796
...
...
@@ -19,15 +19,14 @@ namespace phi {
KernelSignature
Conv3dOpArgumentMapping
(
const
ArgumentMappingContext
&
ctx
)
{
return
KernelSignature
(
"conv3d"
,
{
"Input"
,
"Filter"
},
{
"strides"
,
"paddings"
,
"padding_algorithm"
,
"groups"
,
"dilations"
,
"data_format"
,
"use_addto"
,
"workspace_size_MB"
,
"exhaustive_search"
},
{
"strides"
,
"paddings"
,
"padding_algorithm"
,
"groups"
,
"dilations"
,
"data_format"
,
},
{
"Output"
});
}
...
...
@@ -39,31 +38,27 @@ KernelSignature Conv3dGradOpArgumentMapping(const ArgumentMappingContext& ctx) {
"padding_algorithm"
,
"groups"
,
"dilations"
,
"data_format"
,
"use_addto"
,
"workspace_size_MB"
,
"exhaustive_search"
},
"data_format"
},
{
"Input@GRAD"
,
"Filter@GRAD"
});
}
KernelSignature
Conv3dDoubleGradOpArgumentMapping
(
const
ArgumentMappingContext
&
ctx
)
{
return
KernelSignature
(
"conv3d_
grad
_grad"
,
return
KernelSignature
(
"conv3d_
double
_grad"
,
{
"Input"
,
"Filter"
,
"DOutput"
,
"DDInput"
,
"DDFilter"
},
{
"strides"
,
"paddings"
,
"padding_algorithm"
,
"groups"
,
"dilations"
,
"data_format"
,
"use_addto"
,
"workspace_size_MB"
,
"exhaustive_search"
},
"data_format"
},
{
"DInput"
,
"DFilter"
,
"DDOutput"
});
}
}
// namespace phi
PD_REGISTER_BASE_KERNEL_NAME
(
conv3d_grad_grad
,
conv3d_double_grad
);
PD_REGISTER_ARG_MAPPING_FN
(
conv3d
,
phi
::
Conv3dOpArgumentMapping
);
PD_REGISTER_ARG_MAPPING_FN
(
conv3d_grad
,
phi
::
Conv3dGradOpArgumentMapping
);
PD_REGISTER_ARG_MAPPING_FN
(
conv3d_grad_grad
,
...
...
paddle/phi/ops/compat/depthwise_conv2d_sig.cc
浏览文件 @
fe8c6796
...
...
@@ -25,11 +25,7 @@ KernelSignature DepthwiseConv2dOpArgumentMapping(
"padding_algorithm"
,
"groups"
,
"dilations"
,
"data_format"
,
"use_addto"
,
"workspace_size_MB"
,
"exhaustive_search"
,
"fuse_relu_before_depthwise_conv"
},
"data_format"
},
{
"Output"
});
}
...
...
@@ -42,33 +38,28 @@ KernelSignature DepthwiseConv2dGradOpArgumentMapping(
"padding_algorithm"
,
"groups"
,
"dilations"
,
"data_format"
,
"use_addto"
,
"workspace_size_MB"
,
"exhaustive_search"
,
"fuse_relu_before_depthwise_conv"
},
"data_format"
},
{
"Input@GRAD"
,
"Filter@GRAD"
});
}
KernelSignature
DepthwiseConv2dDoubleGradOpArgumentMapping
(
const
ArgumentMappingContext
&
ctx
)
{
return
KernelSignature
(
"depthwise_conv2d_
grad
_grad"
,
return
KernelSignature
(
"depthwise_conv2d_
double
_grad"
,
{
"Input"
,
"Filter"
,
"DOutput"
,
"DDInput"
,
"DDFilter"
},
{
"strides"
,
"paddings"
,
"padding_algorithm"
,
"groups"
,
"dilations"
,
"data_format"
,
"use_addto"
,
"workspace_size_MB"
,
"exhaustive_search"
,
"fuse_relu_before_depthwise_conv"
},
"data_format"
},
{
"DInput"
,
"DFilter"
,
"DDOutput"
});
}
}
// namespace phi
PD_REGISTER_BASE_KERNEL_NAME
(
depthwise_conv2d_grad_grad
,
depthwise_conv2d_double_grad
);
PD_REGISTER_ARG_MAPPING_FN
(
depthwise_conv2d
,
phi
::
DepthwiseConv2dOpArgumentMapping
);
PD_REGISTER_ARG_MAPPING_FN
(
depthwise_conv2d_grad
,
...
...
paddle/phi/ops/compat/sync_batch_norm_sig.cc
浏览文件 @
fe8c6796
...
...
@@ -19,14 +19,13 @@ namespace phi {
KernelSignature
SyncBatchNormOpArgumentMapping
(
const
ArgumentMappingContext
&
ctx
)
{
return
KernelSignature
(
"sync_batch_norm"
,
{
"X"
,
"Scale"
,
"Bias"
,
"Mean"
,
"Variance"
},
{
"momentum"
,
{
"X"
,
"Mean"
,
"Variance"
,
"Scale"
,
"Bias"
},
{
"is_test"
,
"momentum"
,
"epsilon"
,
"data_layout"
,
"is_test"
,
"use_global_stats"
,
"trainable_statistics"
,
"fuse_with_relu"
},
"trainable_statistics"
},
{
"Y"
,
"MeanOut"
,
"VarianceOut"
,
...
...
@@ -52,8 +51,7 @@ KernelSignature SyncBatchNormGradOpArgumentMapping(
"data_layout"
,
"is_test"
,
"use_global_stats"
,
"trainable_statistics"
,
"fuse_with_relu"
},
"trainable_statistics"
},
{
"X@GRAD"
,
"Scale@GRAD"
,
"Bias@GRAD"
});
}
...
...
python/paddle/fluid/dygraph/nn.py
浏览文件 @
fe8c6796
...
...
@@ -1533,17 +1533,16 @@ class BatchNorm(layers.Layer):
if
in_dygraph_mode
():
batch_norm_out
,
t1
,
t2
,
t3
,
t4
,
_
=
_C_ops
.
batch_norm
(
input
,
self
.
weight
,
self
.
bias
,
self
.
_mean
,
self
.
_variance
,
self
.
weight
,
self
.
bias
,
not
self
.
training
,
self
.
_momentum
,
self
.
_epsilon
,
self
.
_data_layout
,
not
self
.
training
,
self
.
_use_global_stats
,
self
.
_trainable_statistics
,
False
,
)
return
dygraph_utils
.
_append_activation_in_dygraph
(
batch_norm_out
,
act
=
self
.
_act
,
use_mkldnn
=
self
.
_use_mkldnn
...
...
python/paddle/nn/functional/conv.py
浏览文件 @
fe8c6796
...
...
@@ -172,10 +172,6 @@ def _conv_nd(
groups
,
dilation
,
data_format
,
False
,
-
1
,
False
,
False
,
use_cudnn
,
)
if
bias
is
not
None
:
...
...
@@ -202,9 +198,6 @@ def _conv_nd(
groups
,
dilation
,
data_format
,
False
,
-
1
,
False
,
)
if
bias
is
not
None
:
channel_dim
=
(
...
...
python/paddle/nn/functional/norm.py
浏览文件 @
fe8c6796
...
...
@@ -202,17 +202,16 @@ def batch_norm(
if
in_dygraph_mode
():
batch_norm_out
,
_
,
_
,
_
,
_
,
_
=
_C_ops
.
batch_norm
(
x
,
weight
,
bias
,
running_mean
,
running_var
,
weight
,
bias
,
not
training
,
momentum
,
epsilon
,
data_format
,
not
training
,
use_global_stats
,
trainable_statistics
,
False
,
)
return
dygraph_utils
.
_append_activation_in_dygraph
(
...
...
python/paddle/nn/layer/norm.py
浏览文件 @
fe8c6796
...
...
@@ -1180,15 +1180,14 @@ class SyncBatchNorm(_BatchNormBase):
if
in_dygraph_mode
():
sync_batch_norm_out
,
_
,
_
,
_
,
_
,
_
=
_C_ops
.
sync_batch_norm_
(
x
,
self
.
weight
,
self
.
bias
,
self
.
_mean
,
self
.
_variance
,
self
.
weight
,
self
.
bias
,
not
self
.
training
,
self
.
_momentum
,
self
.
_epsilon
,
self
.
_data_format
,
not
self
.
training
,
False
,
False
,
False
,
)
...
...
python/paddle/sparse/nn/layer/norm.py
浏览文件 @
fe8c6796
...
...
@@ -140,17 +140,16 @@ class BatchNorm(paddle.nn.BatchNorm1D):
if
in_dynamic_mode
():
batch_norm_out
,
_
,
_
,
_
,
_
,
_
=
_C_ops
.
sparse_batch_norm
(
input
,
self
.
weight
,
self
.
bias
,
self
.
_mean
,
self
.
_variance
,
self
.
weight
,
self
.
bias
,
not
self
.
training
,
self
.
_momentum
,
self
.
_epsilon
,
data_format
,
not
self
.
training
,
self
.
_use_global_stats
,
trainable_statistics
,
False
,
)
return
batch_norm_out
else
:
...
...
@@ -324,15 +323,14 @@ class SyncBatchNorm(paddle.nn.SyncBatchNorm):
self
.
_check_data_format
()
sync_batch_norm_out
,
_
,
_
,
_
,
_
,
_
=
_C_ops
.
sparse_sync_batch_norm_
(
x
,
self
.
weight
,
self
.
bias
,
self
.
_mean
,
self
.
_variance
,
self
.
weight
,
self
.
bias
,
not
self
.
training
,
self
.
_momentum
,
self
.
_epsilon
,
self
.
_data_format
,
not
self
.
training
,
False
,
False
,
False
,
)
...
...
编辑
预览
Markdown
is supported
0%
请重试
或
添加新附件
.
添加附件
取消
You are about to add
0
people
to the discussion. Proceed with caution.
先完成此消息的编辑!
取消
想要评论请
注册
或
登录