Skip to content
体验新版
项目
组织
正在加载...
登录
切换导航
打开侧边栏
s920243400
PaddleDetection
提交
976f96a9
P
PaddleDetection
项目概览
s920243400
/
PaddleDetection
与 Fork 源项目一致
Fork自
PaddlePaddle / PaddleDetection
通知
2
Star
0
Fork
0
代码
文件
提交
分支
Tags
贡献者
分支图
Diff
Issue
0
列表
看板
标记
里程碑
合并请求
0
Wiki
0
Wiki
分析
仓库
DevOps
项目成员
Pages
P
PaddleDetection
项目概览
项目概览
详情
发布
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
Issue
0
Issue
0
列表
看板
标记
里程碑
合并请求
0
合并请求
0
Pages
分析
分析
仓库分析
DevOps
Wiki
0
Wiki
成员
成员
收起侧边栏
关闭侧边栏
动态
分支图
创建新Issue
提交
Issue看板
未验证
提交
976f96a9
编写于
11月 28, 2017
作者:
P
peterzhang2029
提交者:
GitHub
11月 28, 2017
浏览文件
操作
浏览文件
下载
差异文件
Merge pull request #5926 from peterzhang2029/hsigmoid_gpu
Fix hsigmoid_layer when using GPU.
上级
c975fe1b
b156c6a3
变更
3
隐藏空白更改
内联
并排
Showing
3 changed file
with
140 addition
and
24 deletion
+140
-24
paddle/gserver/layers/HierarchicalSigmoidLayer.cpp
paddle/gserver/layers/HierarchicalSigmoidLayer.cpp
+124
-18
paddle/gserver/layers/HierarchicalSigmoidLayer.h
paddle/gserver/layers/HierarchicalSigmoidLayer.h
+9
-0
paddle/gserver/tests/test_LayerGrad.cpp
paddle/gserver/tests/test_LayerGrad.cpp
+7
-6
未找到文件。
paddle/gserver/layers/HierarchicalSigmoidLayer.cpp
浏览文件 @
976f96a9
...
...
@@ -64,49 +64,111 @@ void HierarchicalSigmoidLayer::forward(PassType passType) {
batchSize
,
codeLength_
,
/* trans */
false
,
useGpu
(
deviceId_
)
);
false
);
Matrix
::
resizeOrCreate
(
preOutput_
.
grad
,
batchSize
,
codeLength_
,
/* trans */
false
,
useGpu
(
deviceId_
));
false
);
IVectorPtr
label
=
getInput
(
*
getLabelLayer
()).
ids
;
preOutput_
.
value
->
zeroMem
();
if
(
useGpu_
)
{
Matrix
::
resizeOrCreate
(
cpuOutput_
,
output_
.
value
->
getHeight
(),
output_
.
value
->
getWidth
(),
/* trans */
false
,
false
);
IVector
::
resizeOrCreate
(
cpuLabel_
,
label
->
getSize
(),
false
);
cpuLabel_
->
copyFrom
(
*
label
);
cpuOutput_
->
copyFrom
(
*
output_
.
value
);
}
else
{
cpuOutput_
=
output_
.
value
;
cpuLabel_
=
label
;
}
/* add the bias-vector */
if
(
biases_
.
get
()
!=
NULL
)
{
preOutput_
.
value
->
addByBitCode
(
numClasses_
,
*
label
,
*
biases_
->
getW
());
if
(
useGpu_
)
{
Matrix
::
resizeOrCreate
(
cpuBias_
,
1
,
numClasses_
-
1
,
/* trans */
false
,
false
);
cpuBias_
->
copyFrom
(
*
biases_
->
getW
());
}
else
{
cpuBias_
=
biases_
->
getW
();
}
preOutput_
.
value
->
addByBitCode
(
numClasses_
,
*
cpuLabel_
,
*
cpuBias_
);
}
for
(
size_t
i
=
0
;
i
<
inputLayers_
.
size
()
-
1
;
++
i
)
{
MatrixPtr
input
=
getInputValue
(
i
);
if
(
useGpu_
)
{
Matrix
::
resizeOrCreate
(
cpuInput_
,
input
->
getHeight
(),
input
->
getWidth
(),
/* trans */
false
,
false
);
Matrix
::
resizeOrCreate
(
cpuWeight_
,
weights_
[
i
]
->
getW
()
->
getHeight
(),
weights_
[
i
]
->
getW
()
->
getWidth
(),
/* trans */
false
,
false
);
cpuInput_
->
copyFrom
(
*
input
);
cpuWeight_
->
copyFrom
(
*
weights_
[
i
]
->
getW
());
}
else
{
cpuInput_
=
input
;
cpuWeight_
=
weights_
[
i
]
->
getW
();
}
preOutput_
.
value
->
mulByBitCode
(
numClasses_
,
*
label
,
*
weights_
[
i
]
->
getW
(),
*
input
);
numClasses_
,
*
cpuLabel_
,
*
cpuWeight_
,
*
cpuInput_
);
}
// keep consistent with the clipping in the following softrelu
preOutput_
.
value
->
clip
(
-
40.0
,
40.0
);
preOutput_
.
value
->
sumByBitCode
(
numClasses_
,
*
label
,
*
output_
.
value
,
*
cpuLabel_
,
*
cpuOutput_
,
-
1
);
// scaleSum
preOutput_
.
value
->
softrelu
(
*
preOutput_
.
value
);
MatrixPtr
sum
=
Matrix
::
create
(
batchSize
,
1
,
/* trans= */
false
,
useGpu
(
deviceId_
));
MatrixPtr
sum
=
Matrix
::
create
(
batchSize
,
1
,
/* trans= */
false
,
false
);
preOutput_
.
value
->
rowSum
(
*
sum
);
output_
.
value
->
add
(
*
sum
);
cpuOutput_
->
add
(
*
sum
);
if
(
useGpu_
)
{
output_
.
value
->
copyFrom
(
*
cpuOutput_
);
}
else
{
output_
.
value
=
cpuOutput_
;
}
}
void
HierarchicalSigmoidLayer
::
backward
(
const
UpdateCallback
&
callback
)
{
IVectorPtr
label
=
getInput
(
*
getLabelLayer
()).
ids
;
if
(
useGpu_
)
{
IVector
::
resizeOrCreate
(
cpuLabel_
,
label
->
getSize
(),
false
);
cpuLabel_
->
copyFrom
(
*
label
);
}
else
{
cpuLabel_
=
label
;
}
preOutput_
.
grad
->
one
();
preOutput_
.
grad
->
softreluDerivative
(
*
preOutput_
.
value
);
preOutput_
.
grad
->
subByBitCode
(
numClasses_
,
*
label
);
preOutput_
.
grad
->
subByBitCode
(
numClasses_
,
*
cpuLabel_
);
if
(
biases_
&&
biases_
->
getWGrad
())
{
preOutput_
.
grad
->
addByBitCodeBackward
(
numClasses_
,
*
label
,
*
biases_
->
getWGrad
());
MatrixPtr
biases_grad
=
biases_
->
getWGrad
();
if
(
useGpu_
)
{
Matrix
::
resizeOrCreate
(
cpuBias_
,
1
,
numClasses_
-
1
,
/* trans */
false
,
false
);
cpuBias_
->
copyFrom
(
*
biases_grad
);
}
else
{
cpuBias_
=
biases_grad
;
}
preOutput_
.
grad
->
addByBitCodeBackward
(
numClasses_
,
*
cpuLabel_
,
*
cpuBias_
);
if
(
useGpu
)
{
biases_grad
->
copyFrom
(
*
cpuBias_
);
}
else
{
biases_grad
=
cpuBias_
;
}
/* Increasing the number of gradient */
biases_
->
getParameterPtr
()
->
incUpdate
(
callback
);
}
...
...
@@ -115,9 +177,31 @@ void HierarchicalSigmoidLayer::backward(const UpdateCallback& callback) {
/* Calculate the W-gradient for the current layer */
MatrixPtr
input
=
getInputValue
(
i
);
if
(
weights_
[
i
]
->
getWGrad
())
{
MatrixPtr
weights_grad
=
weights_
[
i
]
->
getWGrad
();
if
(
useGpu_
)
{
Matrix
::
resizeOrCreate
(
cpuInput_
,
input
->
getHeight
(),
input
->
getWidth
(),
/* trans */
false
,
false
);
Matrix
::
resizeOrCreate
(
cpuWeightGrad_
,
weights_grad
->
getHeight
(),
weights_grad
->
getWidth
(),
/* trans */
false
,
false
);
cpuInput_
->
copyFrom
(
*
input
);
cpuWeightGrad_
->
copyFrom
(
*
weights_grad
);
}
else
{
cpuInput_
=
input
;
cpuWeightGrad_
=
weights_grad
;
}
preOutput_
.
grad
->
mulByBitCodeBackwardWeight
(
numClasses_
,
*
label
,
*
weights_
[
i
]
->
getWGrad
(),
*
input
);
numClasses_
,
*
cpuLabel_
,
*
cpuWeightGrad_
,
*
cpuInput_
);
if
(
useGpu_
)
{
weights_grad
->
copyFrom
(
*
cpuWeightGrad_
);
}
else
{
weights_grad
=
cpuWeightGrad_
;
}
/* Increasing the number of gradient */
weights_
[
i
]
->
getParameterPtr
()
->
incUpdate
(
callback
);
}
...
...
@@ -125,8 +209,30 @@ void HierarchicalSigmoidLayer::backward(const UpdateCallback& callback) {
/* Calculate the input layers error */
MatrixPtr
inputGrad
=
getInputGrad
(
i
);
if
(
inputGrad
)
{
if
(
useGpu_
)
{
Matrix
::
resizeOrCreate
(
cpuInputGrad_
,
inputGrad
->
getHeight
(),
inputGrad
->
getWidth
(),
/* trans */
false
,
false
);
Matrix
::
resizeOrCreate
(
cpuWeight_
,
weights_
[
i
]
->
getW
()
->
getHeight
(),
weights_
[
i
]
->
getW
()
->
getWidth
(),
/* trans */
false
,
false
);
cpuInputGrad_
->
copyFrom
(
*
inputGrad
);
cpuWeight_
->
copyFrom
(
*
weights_
[
i
]
->
getW
());
}
else
{
cpuInputGrad_
=
inputGrad
;
cpuWeight_
=
weights_
[
i
]
->
getW
();
}
preOutput_
.
grad
->
mulByBitCodeBackwardError
(
numClasses_
,
*
label
,
*
weights_
[
i
]
->
getW
(),
*
inputGrad
);
numClasses_
,
*
cpuLabel_
,
*
cpuWeight_
,
*
cpuInputGrad_
);
if
(
useGpu_
)
{
inputGrad
->
copyFrom
(
*
cpuInputGrad_
);
}
else
{
inputGrad
=
cpuInputGrad_
;
}
}
}
}
...
...
paddle/gserver/layers/HierarchicalSigmoidLayer.h
浏览文件 @
976f96a9
...
...
@@ -80,6 +80,15 @@ protected:
int
codeLength_
;
/// temporary result of output_
Argument
preOutput_
;
/// The temporary variables in CPU memory.
MatrixPtr
cpuWeight_
;
MatrixPtr
cpuWeightGrad_
;
MatrixPtr
cpuInput_
;
MatrixPtr
cpuInputGrad_
;
MatrixPtr
cpuBias_
;
MatrixPtr
cpuOutput_
;
IVectorPtr
cpuLabel_
;
};
}
// namespace paddle
paddle/gserver/tests/test_LayerGrad.cpp
浏览文件 @
976f96a9
...
...
@@ -681,12 +681,13 @@ TEST(Layer, hsigmoidLayer) {
config
.
layerConfig
.
add_inputs
();
config
.
layerConfig
.
add_inputs
();
// Not support GPU now
testLayerGrad
(
config
,
"hsigmoid"
,
100
,
/* trans */
false
,
/* useGpu */
false
);
for
(
auto
useGpu
:
{
false
,
true
})
{
testLayerGrad
(
config
,
"hsigmoid"
,
100
,
/* trans */
false
,
/* useGpu */
useGpu
);
}
}
TEST
(
Layer
,
multi_cross
)
{
...
...
编辑
预览
Markdown
is supported
0%
请重试
或
添加新附件
.
添加附件
取消
You are about to add
0
people
to the discussion. Proceed with caution.
先完成此消息的编辑!
取消
想要评论请
注册
或
登录