未验证 提交 2c14df34 编写于 作者: Z Zhaolong Xing 提交者: GitHub

Merge pull request #11017 from NHZlX/fix_depthwise_neon_bug

Fix NEON depthwise conv bug
......@@ -66,8 +66,9 @@ class NeonDepthwiseConvFunction : public ConvFunctionBase {
float* inputPadding = inputData;
int padInputHeight = inputHeight + 2 * paddingH();
int padInputWidth = inputWidth + 2 * paddingW();
if (paddingH() > 0 || paddingW() > 0) {
- int newSize = batchSize * inputChannels * padInputHeight * padInputWidth;
+ int newSize =
+ batchSize * (inputChannels + 1) * padInputHeight * padInputWidth;
resizeBuffer<Device>(newSize);
inputPadding = reinterpret_cast<float*>(memory_->getBuf());
neon::Padding<float>::run(inputData,
......@@ -77,7 +78,6 @@ class NeonDepthwiseConvFunction : public ConvFunctionBase {
inputWidth,
padInputHeight,
padInputWidth);
}
std::function<void(
const float*, const float*, int, int, int, int, int, int, float*)>
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册