Skip to content
体验新版
项目
组织
正在加载...
登录
切换导航
打开侧边栏
BaiXuePrincess
Paddle
提交
b720f282
P
Paddle
项目概览
BaiXuePrincess
/
Paddle
与 Fork 源项目一致
Fork自
PaddlePaddle / Paddle
通知
1
Star
1
Fork
0
代码
文件
提交
分支
Tags
贡献者
分支图
Diff
Issue
0
列表
看板
标记
里程碑
合并请求
0
Wiki
0
Wiki
分析
仓库
DevOps
项目成员
Pages
P
Paddle
项目概览
项目概览
详情
发布
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
Issue
0
Issue
0
列表
看板
标记
里程碑
合并请求
0
合并请求
0
Pages
分析
分析
仓库分析
DevOps
Wiki
0
Wiki
成员
成员
收起侧边栏
关闭侧边栏
动态
分支图
创建新Issue
提交
Issue看板
“f7d64987cf648fbaf8842601e77b5473f1a031ef”上不存在“develop/doc_cn/howto/raspberry/build_for_raspberry.html”
提交
b720f282
编写于
11月 01, 2017
作者:
Z
zchen0211
浏览文件
操作
浏览文件
下载
电子邮件补丁
差异文件
deconv modify
上级
4e228021
变更
3
显示空白变更内容
内联
并排
Showing
3 changed file
with
9 addition
and
12 deletion
+9
-12
paddle/operators/conv2dtranspose_cudnn_op.cc
paddle/operators/conv2dtranspose_cudnn_op.cc
+4
-4
paddle/operators/conv2dtranspose_cudnn_op.cu
paddle/operators/conv2dtranspose_cudnn_op.cu
+3
-5
python/paddle/v2/framework/tests/test_conv2dtranspose_op.py
python/paddle/v2/framework/tests/test_conv2dtranspose_op.py
+2
-3
未找到文件。
paddle/operators/conv2dtranspose_cudnn_op.cc
浏览文件 @
b720f282
...
@@ -38,13 +38,13 @@ class CudnnConv2DTransposeOpMaker : public Conv2DTransposeOpMaker {
...
@@ -38,13 +38,13 @@ class CudnnConv2DTransposeOpMaker : public Conv2DTransposeOpMaker {
}
// namespace paddle
}
// namespace paddle
namespace
ops
=
paddle
::
operators
;
namespace
ops
=
paddle
::
operators
;
REGISTER_OP
(
conv2dtranspose_cudnn
,
ops
::
Conv2DTransposeOp
,
REGISTER_OP
(
conv2d
_
transpose_cudnn
,
ops
::
Conv2DTransposeOp
,
ops
::
CudnnConv2DTransposeOpMaker
,
conv2dtranspose_cudnn_grad
,
ops
::
CudnnConv2DTransposeOpMaker
,
conv2d
_
transpose_cudnn_grad
,
ops
::
Conv2DTransposeOpGrad
);
ops
::
Conv2DTransposeOpGrad
);
REGISTER_OP_CPU_KERNEL
(
REGISTER_OP_CPU_KERNEL
(
conv2dtranspose_cudnn
,
conv2d
_
transpose_cudnn
,
ops
::
GemmConv2DTransposeKernel
<
paddle
::
platform
::
CPUPlace
,
float
>
);
ops
::
GemmConv2DTransposeKernel
<
paddle
::
platform
::
CPUPlace
,
float
>
);
REGISTER_OP_CPU_KERNEL
(
REGISTER_OP_CPU_KERNEL
(
conv2dtranspose_cudnn_grad
,
conv2d
_
transpose_cudnn_grad
,
ops
::
GemmConv2DTransposeGradKernel
<
paddle
::
platform
::
CPUPlace
,
float
>
);
ops
::
GemmConv2DTransposeGradKernel
<
paddle
::
platform
::
CPUPlace
,
float
>
);
paddle/operators/conv2dtranspose_cudnn_op.cu
浏览文件 @
b720f282
...
@@ -15,7 +15,7 @@
...
@@ -15,7 +15,7 @@
#include "paddle/framework/eigen.h"
#include "paddle/framework/eigen.h"
#include "paddle/framework/op_registry.h"
#include "paddle/framework/op_registry.h"
#include "paddle/memory/memory.h"
#include "paddle/memory/memory.h"
#include "paddle/operators/conv2d_op.h"
#include "paddle/operators/conv2d
transpose
_op.h"
#include "paddle/platform/assert.h"
#include "paddle/platform/assert.h"
#include "paddle/platform/cudnn_helper.h"
#include "paddle/platform/cudnn_helper.h"
...
@@ -76,7 +76,6 @@ class CudnnConvTransposeOpKernel : public framework::OpKernel<T> {
...
@@ -76,7 +76,6 @@ class CudnnConvTransposeOpKernel : public framework::OpKernel<T> {
workspace_size_limit
=
user_workspace_size
*
1024
*
1024
;
workspace_size_limit
=
user_workspace_size
*
1024
*
1024
;
}
}
// ------------------- cudnn conv algorithm ---------------------
// ------------------- cudnn conv algorithm ---------------------
// cudnnConvolutionBwdAlgo_t algo;
cudnnConvolutionBwdDataAlgo_t
algo
;
cudnnConvolutionBwdDataAlgo_t
algo
;
auto
handle
=
ctx
.
cuda_device_context
().
cudnn_handle
();
auto
handle
=
ctx
.
cuda_device_context
().
cudnn_handle
();
// Get the algorithm
// Get the algorithm
...
@@ -92,7 +91,6 @@ class CudnnConvTransposeOpKernel : public framework::OpKernel<T> {
...
@@ -92,7 +91,6 @@ class CudnnConvTransposeOpKernel : public framework::OpKernel<T> {
platform
::
dynload
::
cudnnGetConvolutionBackwardDataWorkspaceSize
(
platform
::
dynload
::
cudnnGetConvolutionBackwardDataWorkspaceSize
(
handle
,
cudnn_filter_desc
,
cudnn_input_desc
,
cudnn_conv_desc
,
handle
,
cudnn_filter_desc
,
cudnn_input_desc
,
cudnn_conv_desc
,
cudnn_output_desc
,
algo
,
&
workspace_size_in_bytes
));
cudnn_output_desc
,
algo
,
&
workspace_size_in_bytes
));
// workspace_size_in_bytes = std::max(workspace_size_in_bytes, tmp_size);
// Allocate on GPU memory
// Allocate on GPU memory
platform
::
GPUPlace
gpu
=
boost
::
get
<
platform
::
GPUPlace
>
(
ctx
.
GetPlace
());
platform
::
GPUPlace
gpu
=
boost
::
get
<
platform
::
GPUPlace
>
(
ctx
.
GetPlace
());
...
@@ -234,7 +232,7 @@ class CudnnConvTransposeGradOpKernel : public framework::OpKernel<T> {
...
@@ -234,7 +232,7 @@ class CudnnConvTransposeGradOpKernel : public framework::OpKernel<T> {
namespace
ops
=
paddle
::
operators
;
namespace
ops
=
paddle
::
operators
;
REGISTER_OP_GPU_KERNEL
(
conv2dtranspose_cudnn
,
REGISTER_OP_GPU_KERNEL
(
conv2d
_
transpose_cudnn
,
ops
::
CudnnConvTransposeOpKernel
<
float
>
);
ops
::
CudnnConvTransposeOpKernel
<
float
>
);
REGISTER_OP_GPU_KERNEL
(
conv2dtranspose_cudnn_grad
,
REGISTER_OP_GPU_KERNEL
(
conv2d
_
transpose_cudnn_grad
,
ops
::
CudnnConvTransposeGradOpKernel
<
float
>
);
ops
::
CudnnConvTransposeGradOpKernel
<
float
>
);
python/paddle/v2/framework/tests/test_conv2dtranspose_op.py
浏览文件 @
b720f282
...
@@ -45,13 +45,12 @@ class TestConv2dTransposeOp(OpTest):
...
@@ -45,13 +45,12 @@ class TestConv2dTransposeOp(OpTest):
filter_
=
np
.
random
.
random
(
self
.
filter_size
).
astype
(
"float32"
)
filter_
=
np
.
random
.
random
(
self
.
filter_size
).
astype
(
"float32"
)
output
=
conv2dtranspose_forward_naive
(
output
=
conv2dtranspose_forward_naive
(
input_
,
filter_
,
conv2dtranspose_param
).
astype
(
'float32'
)
input_
,
filter_
,
conv2dtranspose_param
).
astype
(
'float32'
)
# print 'deconv output py', output, output.shape
self
.
inputs
=
{
'Input'
:
input_
,
'Filter'
:
filter_
}
self
.
inputs
=
{
'Input'
:
input_
,
'Filter'
:
filter_
}
self
.
attrs
=
{
self
.
attrs
=
{
'strides'
:
self
.
stride
,
'strides'
:
self
.
stride
,
'paddings'
:
self
.
pad
,
'paddings'
:
self
.
pad
,
#
'dilations': self.dilations
'dilations'
:
self
.
dilations
}
}
self
.
outputs
=
{
'Output'
:
output
}
self
.
outputs
=
{
'Output'
:
output
}
...
@@ -91,7 +90,7 @@ class TestConv2dTransposeOp(OpTest):
...
@@ -91,7 +90,7 @@ class TestConv2dTransposeOp(OpTest):
class
TestCudnn
(
TestConv2dTransposeOp
):
class
TestCudnn
(
TestConv2dTransposeOp
):
def
init_op_type
(
self
):
def
init_op_type
(
self
):
self
.
op_type
=
"conv2dtranspose_cudnn"
self
.
op_type
=
"conv2d
_
transpose_cudnn"
if
__name__
==
'__main__'
:
if
__name__
==
'__main__'
:
...
...
编辑
预览
Markdown
is supported
0%
请重试
或
添加新附件
.
添加附件
取消
You are about to add
0
people
to the discussion. Proceed with caution.
先完成此消息的编辑!
取消
想要评论请
注册
或
登录