Skip to content
体验新版
项目
组织
正在加载...
登录
切换导航
打开侧边栏
BaiXuePrincess
Paddle
提交
5d48e9cc
P
Paddle
项目概览
BaiXuePrincess
/
Paddle
与 Fork 源项目一致
Fork自
PaddlePaddle / Paddle
通知
1
Star
1
Fork
0
代码
文件
提交
分支
Tags
贡献者
分支图
Diff
Issue
0
列表
看板
标记
里程碑
合并请求
0
Wiki
0
Wiki
分析
仓库
DevOps
项目成员
Pages
P
Paddle
项目概览
项目概览
详情
发布
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
Issue
0
Issue
0
列表
看板
标记
里程碑
合并请求
0
合并请求
0
Pages
分析
分析
仓库分析
DevOps
Wiki
0
Wiki
成员
成员
收起侧边栏
关闭侧边栏
动态
分支图
创建新Issue
提交
Issue看板
未验证
提交
5d48e9cc
编写于
4月 16, 2019
作者:
X
xuezhong
提交者:
GitHub
4月 16, 2019
浏览文件
操作
浏览文件
下载
差异文件
Merge pull request #16884 from liuwei1031/release/1.4
test=release/1.4 cherry-pick (#16845)
上级
a5ef6bff
055a5de2
变更
4
隐藏空白更改
内联
并排
Showing
4 changed files
with
81 additions
and
24 deletions
+81
-24
paddle/fluid/operators/lstmp_op.cc
paddle/fluid/operators/lstmp_op.cc
+43
-6
paddle/fluid/operators/lstmp_op.h
paddle/fluid/operators/lstmp_op.h
+2
-2
paddle/fluid/operators/sample_logits_op.cc
paddle/fluid/operators/sample_logits_op.cc
+31
-15
python/paddle/fluid/layers/nn.py
python/paddle/fluid/layers/nn.py
+5
-1
未找到文件。
paddle/fluid/operators/lstmp_op.cc
浏览文件 @
5d48e9cc
...
@@ -13,6 +13,7 @@ See the License for the specific language governing permissions and
...
@@ -13,6 +13,7 @@ See the License for the specific language governing permissions and
limitations under the License. */
limitations under the License. */
#include "paddle/fluid/operators/lstmp_op.h"
#include "paddle/fluid/operators/lstmp_op.h"
#include <memory>
#include <string>
#include <string>
namespace
paddle
{
namespace
paddle
{
...
@@ -45,6 +46,7 @@ class LSTMPOp : public framework::OperatorWithKernel {
...
@@ -45,6 +46,7 @@ class LSTMPOp : public framework::OperatorWithKernel {
"Output(BatchHidden) of LSTMP operator should not be null."
);
"Output(BatchHidden) of LSTMP operator should not be null."
);
auto
in_dims
=
ctx
->
GetInputDim
(
"Input"
);
auto
in_dims
=
ctx
->
GetInputDim
(
"Input"
);
PADDLE_ENFORCE_EQ
(
in_dims
.
size
(),
2
,
PADDLE_ENFORCE_EQ
(
in_dims
.
size
(),
2
,
"Input(X)'s rank of LSTMP operator must be 2."
);
"Input(X)'s rank of LSTMP operator must be 2."
);
...
@@ -269,13 +271,47 @@ Users can choose to use fully-connected operator before LSTMP operator.
...
@@ -269,13 +271,47 @@ Users can choose to use fully-connected operator before LSTMP operator.
}
}
};
};
// Describes how to build the `lstmp_grad` operator from a forward `lstmp`
// operator.
//
// The gradient op is wired up as follows:
//   * inputs taken from the forward op's inputs:  Weight, ProjWeight, Bias,
//     H0, C0;
//   * inputs taken from the forward op's outputs: Projection, Cell, BatchGate,
//     BatchCellPreAct, BatchHidden;
//   * the gradient of the forward output Projection;
//   * outputs: gradients of Input, Weight, ProjWeight, Bias, H0 and C0.
//
// Note that the forward "Input" variable itself is not passed to the gradient
// op; only its gradient is produced as an output.
class LSTMPGradMaker : public framework::SingleGradOpDescMaker {
 public:
  using framework::SingleGradOpDescMaker::SingleGradOpDescMaker;

 protected:
  // Returns a newly created description of the `lstmp_grad` operator; the
  // caller receives ownership.
  std::unique_ptr<framework::OpDesc> Apply() const override {
    // Own the descriptor from the moment it is created, so that it is released
    // if any of the calls below throws before the function returns.
    std::unique_ptr<framework::OpDesc> grad_op(new framework::OpDesc());
    grad_op->SetType("lstmp_grad");

    // Forward inputs reused by the gradient computation.
    grad_op->SetInput("Weight", Input("Weight"));
    grad_op->SetInput("ProjWeight", Input("ProjWeight"));
    grad_op->SetInput("Bias", Input("Bias"));

    // Forward outputs reused by the gradient computation.
    grad_op->SetInput("Projection", Output("Projection"));
    grad_op->SetInput("Cell", Output("Cell"));
    grad_op->SetInput("BatchGate", Output("BatchGate"));
    grad_op->SetInput("BatchCellPreAct", Output("BatchCellPreAct"));
    grad_op->SetInput("BatchHidden", Output("BatchHidden"));

    // Initial hidden/cell states of the forward op.
    grad_op->SetInput("H0", Input("H0"));
    grad_op->SetInput("C0", Input("C0"));

    // Incoming gradient with respect to the forward output Projection.
    grad_op->SetInput(framework::GradVarName("Projection"),
                      OutputGrad("Projection"));

    // Gradients produced for the forward op's inputs.
    grad_op->SetOutput(framework::GradVarName("Input"), InputGrad("Input"));
    grad_op->SetOutput(framework::GradVarName("Weight"), InputGrad("Weight"));
    grad_op->SetOutput(framework::GradVarName("ProjWeight"),
                       InputGrad("ProjWeight"));
    grad_op->SetOutput(framework::GradVarName("Bias"), InputGrad("Bias"));
    grad_op->SetOutput(framework::GradVarName("H0"), InputGrad("H0"));
    grad_op->SetOutput(framework::GradVarName("C0"), InputGrad("C0"));

    // The gradient op receives the same attributes as the forward op.
    grad_op->SetAttrMap(Attrs());
    return grad_op;
  }
};
class
LSTMPGradOp
:
public
framework
::
OperatorWithKernel
{
class
LSTMPGradOp
:
public
framework
::
OperatorWithKernel
{
public:
public:
using
framework
::
OperatorWithKernel
::
OperatorWithKernel
;
using
framework
::
OperatorWithKernel
::
OperatorWithKernel
;
void
InferShape
(
framework
::
InferShapeContext
*
ctx
)
const
override
{
void
InferShape
(
framework
::
InferShapeContext
*
ctx
)
const
override
{
PADDLE_ENFORCE
(
ctx
->
HasInput
(
"Input"
),
"Input(Input) of LSTMP operator should not be null."
);
PADDLE_ENFORCE
(
ctx
->
HasInput
(
"Projection"
),
PADDLE_ENFORCE
(
ctx
->
HasInput
(
"Projection"
),
"Input(Projection) of LSTMP operator should not be null."
);
"Input(Projection) of LSTMP operator should not be null."
);
PADDLE_ENFORCE
(
ctx
->
HasInput
(
"Cell"
),
PADDLE_ENFORCE
(
ctx
->
HasInput
(
"Cell"
),
...
@@ -298,7 +334,8 @@ class LSTMPGradOp : public framework::OperatorWithKernel {
...
@@ -298,7 +334,8 @@ class LSTMPGradOp : public framework::OperatorWithKernel {
ctx
->
SetOutputDim
(
g_name
,
ctx
->
GetInputDim
(
name
));
ctx
->
SetOutputDim
(
g_name
,
ctx
->
GetInputDim
(
name
));
};
};
SetOutGradDim
(
"Input"
);
ctx
->
SetOutputDim
(
framework
::
GradVarName
(
"Input"
),
ctx
->
GetInputDim
(
"BatchGate"
));
SetOutGradDim
(
"Weight"
);
SetOutGradDim
(
"Weight"
);
SetOutGradDim
(
"ProjWeight"
);
SetOutGradDim
(
"ProjWeight"
);
SetOutGradDim
(
"Bias"
);
SetOutGradDim
(
"Bias"
);
...
@@ -310,7 +347,8 @@ class LSTMPGradOp : public framework::OperatorWithKernel {
...
@@ -310,7 +347,8 @@ class LSTMPGradOp : public framework::OperatorWithKernel {
framework
::
OpKernelType
GetExpectedKernelType
(
framework
::
OpKernelType
GetExpectedKernelType
(
const
framework
::
ExecutionContext
&
ctx
)
const
override
{
const
framework
::
ExecutionContext
&
ctx
)
const
override
{
return
framework
::
OpKernelType
(
return
framework
::
OpKernelType
(
ctx
.
Input
<
framework
::
LoDTensor
>
(
"Input"
)
->
type
(),
ctx
.
device_context
());
ctx
.
Input
<
framework
::
LoDTensor
>
(
"BatchGate"
)
->
type
(),
ctx
.
device_context
());
}
}
};
};
...
@@ -318,8 +356,7 @@ class LSTMPGradOp : public framework::OperatorWithKernel {
...
@@ -318,8 +356,7 @@ class LSTMPGradOp : public framework::OperatorWithKernel {
}
// namespace paddle
}
// namespace paddle
namespace
ops
=
paddle
::
operators
;
namespace
ops
=
paddle
::
operators
;
REGISTER_OPERATOR
(
lstmp
,
ops
::
LSTMPOp
,
ops
::
LSTMPOpMaker
,
REGISTER_OPERATOR
(
lstmp
,
ops
::
LSTMPOp
,
ops
::
LSTMPOpMaker
,
ops
::
LSTMPGradMaker
);
paddle
::
framework
::
DefaultGradOpDescMaker
<
true
>
);
REGISTER_OPERATOR
(
lstmp_grad
,
ops
::
LSTMPGradOp
);
REGISTER_OPERATOR
(
lstmp_grad
,
ops
::
LSTMPGradOp
);
REGISTER_OP_CPU_KERNEL
(
REGISTER_OP_CPU_KERNEL
(
lstmp
,
ops
::
LSTMPKernel
<
paddle
::
platform
::
CPUDeviceContext
,
float
>
,
lstmp
,
ops
::
LSTMPKernel
<
paddle
::
platform
::
CPUDeviceContext
,
float
>
,
...
...
paddle/fluid/operators/lstmp_op.h
浏览文件 @
5d48e9cc
...
@@ -267,7 +267,6 @@ class LSTMPGradKernel : public framework::OpKernel<T> {
...
@@ -267,7 +267,6 @@ class LSTMPGradKernel : public framework::OpKernel<T> {
}
}
void
Compute
(
const
framework
::
ExecutionContext
&
ctx
)
const
override
{
void
Compute
(
const
framework
::
ExecutionContext
&
ctx
)
const
override
{
auto
*
input
=
ctx
.
Input
<
LoDTensor
>
(
"Input"
);
auto
*
weight
=
ctx
.
Input
<
Tensor
>
(
"Weight"
);
auto
*
weight
=
ctx
.
Input
<
Tensor
>
(
"Weight"
);
auto
*
proj_weight
=
ctx
.
Input
<
Tensor
>
(
"ProjWeight"
);
auto
*
proj_weight
=
ctx
.
Input
<
Tensor
>
(
"ProjWeight"
);
auto
*
bias
=
ctx
.
Input
<
Tensor
>
(
"Bias"
);
auto
*
bias
=
ctx
.
Input
<
Tensor
>
(
"Bias"
);
...
@@ -323,7 +322,8 @@ class LSTMPGradKernel : public framework::OpKernel<T> {
...
@@ -323,7 +322,8 @@ class LSTMPGradKernel : public framework::OpKernel<T> {
ordered_c0_g
.
mutable_data
<
T
>
(
c0_g
->
dims
(),
ctx
.
GetPlace
());
ordered_c0_g
.
mutable_data
<
T
>
(
c0_g
->
dims
(),
ctx
.
GetPlace
());
}
}
auto
in_dims
=
input
->
dims
();
// batch_gate dims equal to input dims
auto
in_dims
=
batch_gate
->
dims
();
auto
out_dims
=
cell_out
->
dims
();
auto
out_dims
=
cell_out
->
dims
();
framework
::
DDim
proj_dims
({
in_dims
[
0
],
proj_weight
->
dims
()[
1
]});
framework
::
DDim
proj_dims
({
in_dims
[
0
],
proj_weight
->
dims
()[
1
]});
int
frame_size
=
static_cast
<
int
>
(
in_dims
[
1
]
/
4
);
int
frame_size
=
static_cast
<
int
>
(
in_dims
[
1
]
/
4
);
...
...
paddle/fluid/operators/sample_logits_op.cc
浏览文件 @
5d48e9cc
...
@@ -13,6 +13,7 @@ See the License for the specific language governing permissions and
...
@@ -13,6 +13,7 @@ See the License for the specific language governing permissions and
limitations under the License. */
limitations under the License. */
#include "paddle/fluid/operators/sample_logits_op.h"
#include "paddle/fluid/operators/sample_logits_op.h"
#include <memory>
#include "paddle/fluid/operators/math/sample_prob.h"
#include "paddle/fluid/operators/math/sample_prob.h"
namespace
paddle
{
namespace
paddle
{
...
@@ -60,6 +61,10 @@ class SampleLogitsOpMaker : public framework::OpProtoAndCheckerMaker {
...
@@ -60,6 +61,10 @@ class SampleLogitsOpMaker : public framework::OpProtoAndCheckerMaker {
"(Tensor, default: Tensor<float>), A 2-D tensor with shape [N, NT + S]."
"(Tensor, default: Tensor<float>), A 2-D tensor with shape [N, NT + S]."
"The probabilites of sampled positive and negtive labels."
)
"The probabilites of sampled positive and negtive labels."
)
.
AsIntermediate
();
.
AsIntermediate
();
AddOutput
(
"LogitsDim"
,
"Store dim information of Logits for gradient op"
)
.
AsIntermediate
();
AddOutput
(
"LabelsDim"
,
"Store dim information of Logits for gradient op"
)
.
AsIntermediate
();
AddOutput
(
"SampledLogits"
,
AddOutput
(
"SampledLogits"
,
"(Tensor, default: Tensor<float>), A 2-D tensor with shape"
"(Tensor, default: Tensor<float>), A 2-D tensor with shape"
"[N, NT + S]. The outputs value of sampled logits, which will be"
"[N, NT + S]. The outputs value of sampled logits, which will be"
...
@@ -121,6 +126,10 @@ class SampleLogitsOp : public framework::OperatorWithKernel {
...
@@ -121,6 +126,10 @@ class SampleLogitsOp : public framework::OperatorWithKernel {
"Output(SampledLogits) should be not null."
);
"Output(SampledLogits) should be not null."
);
PADDLE_ENFORCE
(
ctx
->
HasOutput
(
"SampledLabels"
),
PADDLE_ENFORCE
(
ctx
->
HasOutput
(
"SampledLabels"
),
"Output(SampledLabels) should be not null."
);
"Output(SampledLabels) should be not null."
);
PADDLE_ENFORCE
(
ctx
->
HasOutput
(
"LogitsDim"
),
"Output(LogitsDim) should be not null."
);
PADDLE_ENFORCE
(
ctx
->
HasOutput
(
"LabelsDim"
),
"Output(LabelsDim) should be not null."
);
auto
logits_dims
=
ctx
->
GetInputDim
(
"Logits"
);
auto
logits_dims
=
ctx
->
GetInputDim
(
"Logits"
);
auto
labels_dims
=
ctx
->
GetInputDim
(
"Labels"
);
auto
labels_dims
=
ctx
->
GetInputDim
(
"Labels"
);
...
@@ -137,6 +146,15 @@ class SampleLogitsOp : public framework::OperatorWithKernel {
...
@@ -137,6 +146,15 @@ class SampleLogitsOp : public framework::OperatorWithKernel {
ctx
->
SetOutputDim
(
"Probabilities"
,
{
logits_dims
[
0
],
num_sampled_classes
});
ctx
->
SetOutputDim
(
"Probabilities"
,
{
logits_dims
[
0
],
num_sampled_classes
});
ctx
->
SetOutputDim
(
"SampledLogits"
,
{
logits_dims
[
0
],
num_sampled_classes
});
ctx
->
SetOutputDim
(
"SampledLogits"
,
{
logits_dims
[
0
],
num_sampled_classes
});
ctx
->
SetOutputDim
(
"SampledLabels"
,
{
logits_dims
[
0
],
labels_dims
[
1
]});
ctx
->
SetOutputDim
(
"SampledLabels"
,
{
logits_dims
[
0
],
labels_dims
[
1
]});
// append 0 to shape variable to avoid optimized by memory optimize pass
auto
logits_dim_vec
=
framework
::
vectorize
(
logits_dims
);
logits_dim_vec
.
push_back
(
0
);
ctx
->
SetOutputDim
(
"LogitsDim"
,
framework
::
make_ddim
(
logits_dim_vec
));
auto
labels_dim_vec
=
framework
::
vectorize
(
labels_dims
);
labels_dim_vec
.
push_back
(
0
);
ctx
->
SetOutputDim
(
"LabelsDim"
,
framework
::
make_ddim
(
labels_dim_vec
));
}
}
protected:
protected:
...
@@ -155,28 +173,27 @@ class SampleLogitsOpGrad : public framework::OperatorWithKernel {
...
@@ -155,28 +173,27 @@ class SampleLogitsOpGrad : public framework::OperatorWithKernel {
using
framework
::
OperatorWithKernel
::
OperatorWithKernel
;
using
framework
::
OperatorWithKernel
::
OperatorWithKernel
;
void
InferShape
(
framework
::
InferShapeContext
*
ctx
)
const
override
{
void
InferShape
(
framework
::
InferShapeContext
*
ctx
)
const
override
{
PADDLE_ENFORCE
(
ctx
->
HasInput
(
"Logits"
),
PADDLE_ENFORCE
(
ctx
->
HasInput
(
"Logits
Dim
"
),
"Input(Logits) should not be null."
);
"Input(Logits
Dim
) should not be null."
);
PADDLE_ENFORCE
(
ctx
->
HasInput
(
"Labels"
),
PADDLE_ENFORCE
(
ctx
->
HasInput
(
"Labels
Dim
"
),
"Input(Labels) should be not null."
);
"Input(Labels
Dim
) should be not null."
);
PADDLE_ENFORCE
(
ctx
->
HasInput
(
"Samples"
),
PADDLE_ENFORCE
(
ctx
->
HasInput
(
"Samples"
),
"Input(Samples) should be not null."
);
"Input(Samples) should be not null."
);
PADDLE_ENFORCE
(
ctx
->
HasInput
(
"SampledLogits"
),
"Input(SampledLogits) should be not null."
);
PADDLE_ENFORCE
(
ctx
->
HasInput
(
framework
::
GradVarName
(
"SampledLogits"
)),
PADDLE_ENFORCE
(
ctx
->
HasInput
(
framework
::
GradVarName
(
"SampledLogits"
)),
"Input(SampledLogits@Grad) should not be null."
);
"Input(SampledLogits@Grad) should not be null."
);
PADDLE_ENFORCE
(
ctx
->
HasOutput
(
framework
::
GradVarName
(
"Logits"
)),
PADDLE_ENFORCE
(
ctx
->
HasOutput
(
framework
::
GradVarName
(
"Logits"
)),
"Output(Logits@Grad) should be not null."
);
"Output(Logits@Grad) should be not null."
);
auto
logit_dims
=
ctx
->
GetInputDim
(
"Logits"
);
auto
logits_dims
=
ctx
->
GetInputDim
(
"LogitsDim"
);
auto
label_dims
=
ctx
->
GetInputDim
(
"Labels"
);
logits_dims
=
framework
::
DDim
(
logits_dims
.
Get
(),
logits_dims
.
size
()
-
1
);
PADDLE_ENFORCE_EQ
(
label_dims
.
size
(),
2UL
,
auto
labels_dims
=
ctx
->
GetInputDim
(
"LabelsDim"
);
labels_dims
=
framework
::
DDim
(
labels_dims
.
Get
(),
labels_dims
.
size
()
-
1
);
PADDLE_ENFORCE_EQ
(
labels_dims
.
size
(),
2UL
,
"The label should be a 2-D tensor."
);
"The label should be a 2-D tensor."
);
PADDLE_ENFORCE_EQ
(
logit_dims
.
size
(),
2UL
,
PADDLE_ENFORCE_EQ
(
logit
s
_dims
.
size
(),
2UL
,
"The logits should be a 2-D tensor."
);
"The logits should be a 2-D tensor."
);
ctx
->
SetOutputDim
(
framework
::
GradVarName
(
"Logits"
),
ctx
->
SetOutputDim
(
framework
::
GradVarName
(
"Logits"
),
logits_dims
);
ctx
->
GetInputDim
(
"Logits"
));
}
}
protected:
protected:
...
@@ -199,10 +216,9 @@ class SampleLogitsGradMaker : public framework::SingleGradOpDescMaker {
...
@@ -199,10 +216,9 @@ class SampleLogitsGradMaker : public framework::SingleGradOpDescMaker {
std
::
unique_ptr
<
framework
::
OpDesc
>
Apply
()
const
override
{
std
::
unique_ptr
<
framework
::
OpDesc
>
Apply
()
const
override
{
auto
*
grad_op
=
new
framework
::
OpDesc
();
auto
*
grad_op
=
new
framework
::
OpDesc
();
grad_op
->
SetType
(
"sample_logits_grad"
);
grad_op
->
SetType
(
"sample_logits_grad"
);
grad_op
->
SetInput
(
"Logits
"
,
Input
(
"Logits
"
));
grad_op
->
SetInput
(
"Logits
Dim"
,
Output
(
"LogitsDim
"
));
grad_op
->
SetInput
(
"Labels
"
,
Input
(
"Labels
"
));
grad_op
->
SetInput
(
"Labels
Dim"
,
Output
(
"LabelsDim
"
));
grad_op
->
SetInput
(
"Samples"
,
Output
(
"Samples"
));
grad_op
->
SetInput
(
"Samples"
,
Output
(
"Samples"
));
grad_op
->
SetInput
(
"SampledLogits"
,
Output
(
"SampledLogits"
));
grad_op
->
SetInput
(
framework
::
GradVarName
(
"SampledLogits"
),
grad_op
->
SetInput
(
framework
::
GradVarName
(
"SampledLogits"
),
OutputGrad
(
"SampledLogits"
));
OutputGrad
(
"SampledLogits"
));
grad_op
->
SetOutput
(
framework
::
GradVarName
(
"Logits"
),
InputGrad
(
"Logits"
));
grad_op
->
SetOutput
(
framework
::
GradVarName
(
"Logits"
),
InputGrad
(
"Logits"
));
...
...
python/paddle/fluid/layers/nn.py
浏览文件 @
5d48e9cc
...
@@ -6144,6 +6144,8 @@ def sampled_softmax_with_cross_entropy(logits,
...
@@ -6144,6 +6144,8 @@ def sampled_softmax_with_cross_entropy(logits,
sampled_label
=
helper
.
create_variable_for_type_inference
(
dtype
=
'int64'
)
sampled_label
=
helper
.
create_variable_for_type_inference
(
dtype
=
'int64'
)
sampled_softlabel
=
helper
.
create_variable_for_type_inference
(
sampled_softlabel
=
helper
.
create_variable_for_type_inference
(
dtype
=
logits
.
dtype
)
dtype
=
logits
.
dtype
)
logits_dim
=
helper
.
create_variable_for_type_inference
(
dtype
=
logits
.
dtype
)
labels_dim
=
helper
.
create_variable_for_type_inference
(
dtype
=
label
.
type
)
helper
.
append_op
(
helper
.
append_op
(
type
=
'sample_logits'
,
type
=
'sample_logits'
,
...
@@ -6157,7 +6159,9 @@ def sampled_softmax_with_cross_entropy(logits,
...
@@ -6157,7 +6159,9 @@ def sampled_softmax_with_cross_entropy(logits,
'Samples'
:
samples
,
'Samples'
:
samples
,
'Probabilities'
:
probabilities
,
'Probabilities'
:
probabilities
,
'SampledLabels'
:
sampled_label
,
'SampledLabels'
:
sampled_label
,
'SampledLogits'
:
sampled_logits
'SampledLogits'
:
sampled_logits
,
'LogitsDim'
:
logits_dim
,
'LabelsDim'
:
labels_dim
},
},
attrs
=
{
attrs
=
{
'use_customized_samples'
:
use_customized_samples
,
'use_customized_samples'
:
use_customized_samples
,
...
...
编辑
预览
Markdown
is supported
0%
请重试
或
添加新附件
.
添加附件
取消
You are about to add
0
people
to the discussion. Proceed with caution.
先完成此消息的编辑!
取消
想要评论请
注册
或
登录