Skip to content
体验新版
项目
组织
正在加载...
登录
切换导航
打开侧边栏
Crayon鑫
Paddle
提交
af0264aa
P
Paddle
项目概览
Crayon鑫
/
Paddle
与 Fork 源项目一致
Fork自
PaddlePaddle / Paddle
通知
1
Star
1
Fork
0
代码
文件
提交
分支
Tags
贡献者
分支图
Diff
Issue
1
列表
看板
标记
里程碑
合并请求
0
Wiki
0
Wiki
分析
仓库
DevOps
项目成员
Pages
P
Paddle
项目概览
项目概览
详情
发布
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
Issue
1
Issue
1
列表
看板
标记
里程碑
合并请求
0
合并请求
0
Pages
分析
分析
仓库分析
DevOps
Wiki
0
Wiki
成员
成员
收起侧边栏
关闭侧边栏
动态
分支图
创建新Issue
提交
Issue看板
提交
af0264aa
编写于
9月 05, 2017
作者:
F
fengjiayi
浏览文件
操作
浏览文件
下载
电子邮件补丁
差异文件
Add global function `FalttenToMatrix` and add `axis` for MulOp
上级
86655cb9
变更
2
显示空白变更内容
内联
并排
Showing
2 changed file
with
53 addition
and
22 deletion
+53
-22
paddle/operators/mul_op.cc
paddle/operators/mul_op.cc
+14
-11
paddle/operators/mul_op.h
paddle/operators/mul_op.h
+39
-11
未找到文件。
paddle/operators/mul_op.cc
浏览文件 @
af0264aa
...
@@ -27,24 +27,25 @@ class MulOp : public framework::OperatorWithKernel {
...
@@ -27,24 +27,25 @@ class MulOp : public framework::OperatorWithKernel {
void
InferShape
(
const
framework
::
InferShapeContext
&
ctx
)
const
override
{
void
InferShape
(
const
framework
::
InferShapeContext
&
ctx
)
const
override
{
auto
x_dim
=
ctx
.
Input
<
Tensor
>
(
"X"
)
->
dims
();
auto
x_dim
=
ctx
.
Input
<
Tensor
>
(
"X"
)
->
dims
();
auto
y_dim
=
ctx
.
Input
<
Tensor
>
(
"Y"
)
->
dims
();
auto
y_dim
=
ctx
.
Input
<
Tensor
>
(
"Y"
)
->
dims
();
int
x_num_row_dims
=
GetAttr
<
int
>
(
"
X_num_ra
w_dims"
);
int
x_num_row_dims
=
GetAttr
<
int
>
(
"
x_num_ro
w_dims"
);
int
y_num_row_dims
=
GetAttr
<
int
>
(
"
Y_num_ra
w_dims"
);
int
y_num_row_dims
=
GetAttr
<
int
>
(
"
y_num_ro
w_dims"
);
PADDLE_ENFORCE
(
x_dim
.
size
()
>
x_num_row_dims
,
PADDLE_ENFORCE
(
x_dim
.
size
()
>
x_num_row_dims
,
"The rank of input tensor X(%s) should be larger than "
"The rank of input tensor X(%s) should be larger than "
"`mul_op`'s `
X_num_ra
w_dims`."
,
"`mul_op`'s `
x_num_ro
w_dims`."
,
ctx
.
op
().
Input
(
"X"
));
ctx
.
op
().
Input
(
"X"
));
PADDLE_ENFORCE
(
y_dim
.
size
()
>
y_num_row_dims
,
PADDLE_ENFORCE
(
y_dim
.
size
()
>
y_num_row_dims
,
"The rank of input tensor Y(%s) should be larger than "
"The rank of input tensor Y(%s) should be larger than "
"`mul_op`'s `
Y_num_ra
w_dims`."
,
"`mul_op`'s `
y_num_ro
w_dims`."
,
ctx
.
op
().
Input
(
"Y"
));
ctx
.
op
().
Input
(
"Y"
));
PADDLE_ENFORCE_EQ
(
PADDLE_ENFORCE_EQ
(
product
(
x_dim
,
x_dim
.
size
()
-
x_num_row_dims
,
x_dim
.
size
()),
product
(
x_dim
,
x_dim
.
size
()
-
x_num_row_dims
,
x_dim
.
size
()),
product
(
y_dim
,
0
,
y_dim
.
size
()
-
y_num_row_dims
),
product
(
y_dim
,
0
,
y_dim
.
size
()
-
y_num_row_dims
),
"First matrix's width must be equal with second matrix's height."
);
"First matrix's width must be equal with second matrix's height."
);
ctx
.
Output
<
Tensor
>
(
"Out"
)
->
Resize
(
ctx
.
Output
<
Tensor
>
(
"Out"
)
->
Resize
(
{
product
(
x_dim
,
0
,
x_dim
.
size
()
-
x_num_row_dims
),
{
static_cast
<
int
>
(
product
(
x_dim
,
0
,
x_dim
.
size
()
-
x_num_row_dims
)),
product
(
y_dim
,
y_dim
.
size
()
-
y_num_row_dims
,
y_dim
.
size
())});
static_cast
<
int
>
(
product
(
y_dim
,
y_dim
.
size
()
-
y_num_row_dims
,
y_dim
.
size
()))});
}
}
};
};
...
@@ -96,10 +97,12 @@ class MulOpGrad : public framework::OperatorWithKernel {
...
@@ -96,10 +97,12 @@ class MulOpGrad : public framework::OperatorWithKernel {
auto
*
x_grad
=
ctx
.
Output
<
Tensor
>
(
framework
::
GradVarName
(
"X"
));
auto
*
x_grad
=
ctx
.
Output
<
Tensor
>
(
framework
::
GradVarName
(
"X"
));
auto
*
y_grad
=
ctx
.
Output
<
Tensor
>
(
framework
::
GradVarName
(
"Y"
));
auto
*
y_grad
=
ctx
.
Output
<
Tensor
>
(
framework
::
GradVarName
(
"Y"
));
PADDLE_ENFORCE
(
PADDLE_ENFORCE
(
product
(
x_dim
,
0
,
x_dims
.
size
()
-
x_num_row_dims
)
==
out_dims
[
0
],
product
(
x_dims
,
0
,
x_dims
.
size
()
-
GetAttr
<
int
>
(
"x_num_row_dims"
))
==
out_dims
[
0
],
"The first dimension of Out@GRAD must equal to the first dimension of "
"The first dimension of Out@GRAD must equal to the first dimension of "
"the first operand."
);
"the first operand."
);
PADDLE_ENFORCE
(
product
(
y_dim
,
y_dims
.
size
()
-
y_num_row_dims
,
PADDLE_ENFORCE
(
product
(
y_dims
,
y_dims
.
size
()
-
GetAttr
<
int
>
(
"y_num_row_dims"
),
y_dims
.
size
())
==
out_dims
[
1
],
y_dims
.
size
())
==
out_dims
[
1
],
"The second dimension of Out@GRAD must equal to the second "
"The second dimension of Out@GRAD must equal to the second "
"dimension of the second operand."
);
"dimension of the second operand."
);
...
...
paddle/operators/mul_op.h
浏览文件 @
af0264aa
...
@@ -31,13 +31,25 @@ template <typename Place, typename T>
...
@@ -31,13 +31,25 @@ template <typename Place, typename T>
class
MulKernel
:
public
framework
::
OpKernel
{
class
MulKernel
:
public
framework
::
OpKernel
{
public:
public:
void
Compute
(
const
framework
::
ExecutionContext
&
context
)
const
override
{
void
Compute
(
const
framework
::
ExecutionContext
&
context
)
const
override
{
auto
*
X
=
context
.
Input
<
Tensor
>
(
"X"
);
const
Tensor
*
X
=
context
.
Input
<
Tensor
>
(
"X"
);
auto
*
Y
=
context
.
Input
<
Tensor
>
(
"Y"
);
const
Tensor
*
Y
=
context
.
Input
<
Tensor
>
(
"Y"
);
auto
*
Z
=
context
.
Output
<
Tensor
>
(
"Out"
);
Tensor
*
Z
=
context
.
Output
<
Tensor
>
(
"Out"
);
const
Tensor
X_matrix
=
X
->
dims
().
size
()
>
2
?
framework
::
FlattenToMatrix
<
T
>
(
*
X
,
context
.
template
GetAttr
<
int
>(
"x_num_row_dims"
))
:
*
X
;
const
Tensor
Y_matrix
=
Y
->
dims
().
size
()
>
2
?
framework
::
FlattenToMatrix
<
T
>
(
*
Y
,
context
.
template
GetAttr
<
int
>(
"y_num_row_dims"
))
:
*
Y
;
Z
->
mutable_data
<
T
>
(
context
.
GetPlace
());
Z
->
mutable_data
<
T
>
(
context
.
GetPlace
());
auto
*
device_context
=
auto
*
device_context
=
const_cast
<
platform
::
DeviceContext
*>
(
context
.
device_context_
);
const_cast
<
platform
::
DeviceContext
*>
(
context
.
device_context_
);
math
::
matmul
<
Place
,
T
>
(
*
X
,
false
,
*
Y
,
false
,
1
,
Z
,
0
,
device_context
);
math
::
matmul
<
Place
,
T
>
(
X_matrix
,
false
,
Y_matrix
,
false
,
1
,
Z
,
0
,
device_context
);
}
}
};
};
...
@@ -45,20 +57,36 @@ template <typename Place, typename T>
...
@@ -45,20 +57,36 @@ template <typename Place, typename T>
class
MulGradKernel
:
public
framework
::
OpKernel
{
class
MulGradKernel
:
public
framework
::
OpKernel
{
public:
public:
void
Compute
(
const
framework
::
ExecutionContext
&
ctx
)
const
override
{
void
Compute
(
const
framework
::
ExecutionContext
&
ctx
)
const
override
{
auto
*
X
=
ctx
.
Input
<
Tensor
>
(
"X"
);
int
x_num_row_dims
=
ctx
.
template
GetAttr
<
int
>(
"x_num_row_dims"
);
auto
*
Y
=
ctx
.
Input
<
Tensor
>
(
"Y"
);
int
y_num_row_dims
=
ctx
.
template
GetAttr
<
int
>(
"y_num_row_dims"
);
auto
*
dOut
=
ctx
.
Input
<
Tensor
>
(
framework
::
GradVarName
(
"Out"
));
const
Tensor
*
X
=
ctx
.
Input
<
Tensor
>
(
"X"
);
const
Tensor
*
Y
=
ctx
.
Input
<
Tensor
>
(
"Y"
);
const
Tensor
X_matrix
=
X
->
dims
().
size
()
>
2
?
framework
::
FlattenToMatrix
<
T
>
(
*
X
,
x_num_row_dims
)
:
*
X
;
const
Tensor
Y_matrix
=
Y
->
dims
().
size
()
>
2
?
framework
::
FlattenToMatrix
<
T
>
(
*
Y
,
y_num_row_dims
)
:
*
Y
;
const
Tensor
*
dOut
=
ctx
.
Input
<
Tensor
>
(
framework
::
GradVarName
(
"Out"
));
auto
*
dX
=
ctx
.
Output
<
Tensor
>
(
framework
::
GradVarName
(
"X"
));
Tensor
*
dX
=
ctx
.
Output
<
Tensor
>
(
framework
::
GradVarName
(
"X"
));
auto
*
dY
=
ctx
.
Output
<
Tensor
>
(
framework
::
GradVarName
(
"Y"
));
Tensor
*
dY
=
ctx
.
Output
<
Tensor
>
(
framework
::
GradVarName
(
"Y"
));
dX
->
mutable_data
<
T
>
(
ctx
.
GetPlace
());
dX
->
mutable_data
<
T
>
(
ctx
.
GetPlace
());
dY
->
mutable_data
<
T
>
(
ctx
.
GetPlace
());
dY
->
mutable_data
<
T
>
(
ctx
.
GetPlace
());
Tensor
dX_matrix
=
dX
->
dims
().
size
()
>
2
?
framework
::
FlattenToMatrix
<
T
>
(
*
dX
,
x_num_row_dims
)
:
*
dX
;
Tensor
dY_matrix
=
dY
->
dims
().
size
()
>
2
?
framework
::
FlattenToMatrix
<
T
>
(
*
dY
,
y_num_row_dims
)
:
*
dY
;
auto
*
device_context
=
auto
*
device_context
=
const_cast
<
platform
::
DeviceContext
*>
(
ctx
.
device_context_
);
const_cast
<
platform
::
DeviceContext
*>
(
ctx
.
device_context_
);
// dX = dOut * Y'. dX: M x K, dOut : M x N, Y : K x N
// dX = dOut * Y'. dX: M x K, dOut : M x N, Y : K x N
math
::
matmul
<
Place
,
T
>
(
*
dOut
,
false
,
*
Y
,
true
,
1
,
dX
,
0
,
device_context
);
math
::
matmul
<
Place
,
T
>
(
*
dOut
,
false
,
Y_matrix
,
true
,
1
,
&
dX_matrix
,
0
,
device_context
);
// dY = X' * dOut. dY: K x N, dOut : M x N, X : M x K
// dY = X' * dOut. dY: K x N, dOut : M x N, X : M x K
math
::
matmul
<
Place
,
T
>
(
*
X
,
true
,
*
dOut
,
false
,
1
,
dY
,
0
,
device_context
);
math
::
matmul
<
Place
,
T
>
(
X_matrix
,
true
,
*
dOut
,
false
,
1
,
&
dY_matrix
,
0
,
device_context
);
}
}
};
};
...
...
编辑
预览
Markdown
is supported
0%
请重试
或
添加新附件
.
添加附件
取消
You are about to add
0
people
to the discussion. Proceed with caution.
先完成此消息的编辑!
取消
想要评论请
注册
或
登录