Skip to content
体验新版
项目
组织
正在加载...
登录
切换导航
打开侧边栏
Crayon鑫
Paddle
提交
509cb0bc
P
Paddle
项目概览
Crayon鑫
/
Paddle
与 Fork 源项目一致
Fork自
PaddlePaddle / Paddle
通知
1
Star
1
Fork
0
代码
文件
提交
分支
Tags
贡献者
分支图
Diff
Issue
1
列表
看板
标记
里程碑
合并请求
0
Wiki
0
Wiki
分析
仓库
DevOps
项目成员
Pages
P
Paddle
项目概览
项目概览
详情
发布
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
Issue
1
Issue
1
列表
看板
标记
里程碑
合并请求
0
合并请求
0
Pages
分析
分析
仓库分析
DevOps
Wiki
0
Wiki
成员
成员
收起侧边栏
关闭侧边栏
动态
分支图
创建新Issue
提交
Issue看板
提交
509cb0bc
编写于
6月 10, 2018
作者:
Q
qiaolongfei
浏览文件
操作
浏览文件
下载
电子邮件补丁
差异文件
add unit test, pass the unit test
上级
7cebec4b
变更
3
隐藏空白更改
内联
并排
Showing
3 changed files
with
64 additions
and
9 deletions
+64
-9
paddle/fluid/operators/merge_ids_op.cc
paddle/fluid/operators/merge_ids_op.cc
+10
-2
paddle/fluid/operators/merge_ids_op.h
paddle/fluid/operators/merge_ids_op.h
+16
-7
python/paddle/fluid/tests/unittests/test_merge_ids_op.py
python/paddle/fluid/tests/unittests/test_merge_ids_op.py
+38
-0
未找到文件。
paddle/fluid/operators/merge_ids_op.cc
浏览文件 @
509cb0bc
...
@@ -73,6 +73,15 @@ class MergeIdsOp : public framework::OperatorWithKernel {
...
@@ -73,6 +73,15 @@ class MergeIdsOp : public framework::OperatorWithKernel {
}
}
ctx
->
ShareLoD
(
"Ids"
,
"Out"
);
ctx
->
ShareLoD
(
"Ids"
,
"Out"
);
}
}
private:
// Selects the kernel type for this operator.
//
// The data type is derived from the first tensor bound to the "X" input
// slot; the place is whatever the execution context reports.
// NOTE(review): front() presumes at least one "X" input is present --
// confirm that this is enforced before kernel selection runs.
framework::OpKernelType GetExpectedKernelType(
    const framework::ExecutionContext &ctx) const override {
  const auto x_inputs = ctx.MultiInput<framework::Tensor>("X");
  const auto data_type = framework::ToDataType(x_inputs.front()->type());
  return framework::OpKernelType(data_type, ctx.GetPlace());
}
};
};
class
MergeIdsOpInferVarType
:
public
framework
::
VarTypeInference
{
class
MergeIdsOpInferVarType
:
public
framework
::
VarTypeInference
{
...
@@ -93,5 +102,4 @@ namespace ops = paddle::operators;
...
@@ -93,5 +102,4 @@ namespace ops = paddle::operators;
REGISTER_OPERATOR
(
merge_ids
,
ops
::
MergeIdsOp
,
ops
::
MergeIdsOpMaker
,
REGISTER_OPERATOR
(
merge_ids
,
ops
::
MergeIdsOp
,
ops
::
MergeIdsOpMaker
,
ops
::
MergeIdsOpInferVarType
);
ops
::
MergeIdsOpInferVarType
);
REGISTER_OP_CPU_KERNEL
(
REGISTER_OP_CPU_KERNEL
(
merge_ids
,
ops
::
MergeIdsOpKernel
<
paddle
::
platform
::
CPUPlace
,
int64_t
>
,
merge_ids
,
ops
::
MergeIdsOpKernel
<
paddle
::
platform
::
CPUPlace
,
float
>
);
ops
::
MergeIdsOpKernel
<
paddle
::
platform
::
CPUPlace
,
float
>
);
paddle/fluid/operators/merge_ids_op.h
浏览文件 @
509cb0bc
...
@@ -30,6 +30,7 @@ class MergeIdsOpKernel : public framework::OpKernel<T> {
...
@@ -30,6 +30,7 @@ class MergeIdsOpKernel : public framework::OpKernel<T> {
if
(
!
platform
::
is_cpu_place
(
place
))
{
if
(
!
platform
::
is_cpu_place
(
place
))
{
PADDLE_THROW
(
"MergeIds do not support GPU kernel"
);
PADDLE_THROW
(
"MergeIds do not support GPU kernel"
);
}
}
VLOG
(
3
)
<<
"run in MergeIdsOpKernel"
;
const
auto
*
ids_var
=
ctx
.
InputVar
(
"Ids"
);
const
auto
*
ids_var
=
ctx
.
InputVar
(
"Ids"
);
PADDLE_ENFORCE
(
ids_var
->
IsType
<
framework
::
LoDTensor
>
(),
PADDLE_ENFORCE
(
ids_var
->
IsType
<
framework
::
LoDTensor
>
(),
...
@@ -37,7 +38,7 @@ class MergeIdsOpKernel : public framework::OpKernel<T> {
...
@@ -37,7 +38,7 @@ class MergeIdsOpKernel : public framework::OpKernel<T> {
const
auto
&
ids_tensor
=
ids_var
->
Get
<
framework
::
LoDTensor
>
();
const
auto
&
ids_tensor
=
ids_var
->
Get
<
framework
::
LoDTensor
>
();
const
auto
&
ids_dims
=
ids_tensor
.
dims
();
const
auto
&
ids_dims
=
ids_tensor
.
dims
();
const
T
*
ids
=
ids_tensor
.
data
<
T
>
();
const
int64_t
*
ids
=
ids_tensor
.
data
<
int64_t
>
();
auto
x_tensors
=
ctx
.
MultiInput
<
framework
::
LoDTensor
>
(
"X"
);
auto
x_tensors
=
ctx
.
MultiInput
<
framework
::
LoDTensor
>
(
"X"
);
...
@@ -49,9 +50,11 @@ class MergeIdsOpKernel : public framework::OpKernel<T> {
...
@@ -49,9 +50,11 @@ class MergeIdsOpKernel : public framework::OpKernel<T> {
if
(
embedding_size
==
0
)
{
if
(
embedding_size
==
0
)
{
embedding_size
=
input
->
dims
()[
1
];
embedding_size
=
input
->
dims
()[
1
];
}
}
PADDLE_ENFORCE_EQ
(
embedding_size
,
input
->
dims
()[
1
],
if
(
framework
::
product
(
input
->
dims
())
!=
0
)
{
"embedding size of all input should be the same"
);
PADDLE_ENFORCE_EQ
(
embedding_size
,
input
->
dims
()[
1
],
batch_size
+=
input
->
dims
()[
0
];
"embedding size of all input should be the same"
);
batch_size
+=
input
->
dims
()[
0
];
}
}
}
PADDLE_ENFORCE_EQ
(
PADDLE_ENFORCE_EQ
(
batch_size
,
ids_dims
[
0
],
batch_size
,
ids_dims
[
0
],
...
@@ -61,13 +64,14 @@ class MergeIdsOpKernel : public framework::OpKernel<T> {
...
@@ -61,13 +64,14 @@ class MergeIdsOpKernel : public framework::OpKernel<T> {
if
(
shard_num
==
1
)
{
if
(
shard_num
==
1
)
{
VLOG
(
3
)
<<
"only one shard, we can copy the data directly"
;
VLOG
(
3
)
<<
"only one shard, we can copy the data directly"
;
TensorCopy
(
ids_tensor
,
place
,
out
);
TensorCopy
(
*
x_tensors
[
0
]
,
place
,
out
);
}
else
{
}
else
{
std
::
vector
<
int
>
in_indexs
(
shard_num
,
0
);
std
::
vector
<
int
>
in_indexs
(
shard_num
,
0
);
auto
*
out_data
=
out
->
mutable_data
<
T
>
(
ids_dims
,
place
);
auto
*
out_data
=
out
->
mutable_data
<
T
>
(
framework
::
make_ddim
({
batch_size
,
embedding_size
}),
place
);
// copy data from ins[shard_num] to out.
// copy data from ins[shard_num] to out.
for
(
int
i
=
0
;
i
<
ids_dims
[
0
];
++
i
)
{
for
(
int
i
=
0
;
i
<
ids_dims
[
0
];
++
i
)
{
T
id
=
ids
[
i
];
int64_t
id
=
ids
[
i
];
size_t
shard_id
=
static_cast
<
size_t
>
(
id
)
%
shard_num
;
size_t
shard_id
=
static_cast
<
size_t
>
(
id
)
%
shard_num
;
int
index
=
in_indexs
[
shard_id
];
int
index
=
in_indexs
[
shard_id
];
memcpy
(
out_data
+
embedding_size
*
i
,
memcpy
(
out_data
+
embedding_size
*
i
,
...
@@ -75,6 +79,11 @@ class MergeIdsOpKernel : public framework::OpKernel<T> {
...
@@ -75,6 +79,11 @@ class MergeIdsOpKernel : public framework::OpKernel<T> {
sizeof
(
T
)
*
embedding_size
);
sizeof
(
T
)
*
embedding_size
);
in_indexs
[
shard_id
]
+=
1
;
in_indexs
[
shard_id
]
+=
1
;
}
}
for
(
int
i
=
0
;
i
<
shard_num
;
++
i
)
{
PADDLE_ENFORCE_EQ
(
in_indexs
[
i
],
x_tensors
[
i
]
->
dims
()[
0
],
"after merge, all data in x_tensor should be used"
);
}
}
}
}
}
};
};
...
...
python/paddle/fluid/tests/unittests/test_merge_ids_op.py
0 → 100644
浏览文件 @
509cb0bc
# Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
import
unittest
import
numpy
as
np
from
op_test
import
OpTest
class TestMergeIdsOp(OpTest):
    """Output check for the ``merge_ids`` operator.

    The fixture feeds seven int64 ids plus three ``X`` inputs (one of them
    empty) and compares the operator result with a hand-written expected
    matrix.
    """

    def setUp(self):
        """Build the operator type, inputs and expected output."""
        self.op_type = "merge_ids"

        # One id per row, shape (7, 1).
        id_column = np.array(
            [[0], [2], [2], [3], [5], [5], [6]]).astype('int64')

        # Three "X" inputs; the middle one deliberately holds no rows.
        shard0 = np.array(
            [[0.1, 0.2], [0.2, 0.3], [0.3, 0.4]]).astype('float32')
        shard1 = np.array([]).astype('float32')
        shard2 = np.array(
            [[0.4, 0.5], [0.4, 0.5], [0.5, 0.6], [0.5, 0.6]]).astype('float32')

        # Expected rows, in id order: ids 0, 3, 6 consume the rows of x0
        # in sequence, ids 2, 2, 5, 5 consume the rows of x2 in sequence
        # (i.e. id % 3 picks the input, x1 is never selected).
        expected = np.array([
            [0.1, 0.2],
            [0.4, 0.5],
            [0.4, 0.5],
            [0.2, 0.3],
            [0.5, 0.6],
            [0.5, 0.6],
            [0.3, 0.4],
        ]).astype('float32')

        self.inputs = {
            'Ids': id_column,
            "X": [('x0', shard0), ('x1', shard1), ('x2', shard2)],
        }
        self.outputs = {'Out': expected}

    def test_check_output(self):
        """Run the operator and compare against ``self.outputs``."""
        self.check_output()
# Run the test case when this file is executed directly as a script.
if __name__ == '__main__':
    unittest.main()
编辑
预览
Markdown
is supported
0%
请重试
或
添加新附件
.
添加附件
取消
You are about to add
0
people
to the discussion. Proceed with caution.
先完成此消息的编辑!
取消
想要评论请
注册
或
登录