Merge pull request #11017 from NHZlX/fix_depthwise_neon_bug

fix neon depthwise conv bug

Merge pull request #11017 from NHZlX/fix_depthwise_neon_bug
fix neon depthwise conv bug
2c14df34 · Zhaolong Xing · GitHub · 3e177b9d · 75d987a5 · 2c14df34
隐藏空白更改
内联并排

Showing 1 changed file with 12 additions and 12 deletions

paddle/function/neon/NeonDepthwiseConv.cpp paddle/function/neon/NeonDepthwiseConv.cpp +12 -12

未找到文件。
--- a/paddle/function/neon/NeonDepthwiseConv.cpp
+++ b/paddle/function/neon/NeonDepthwiseConv.cpp
@@ -66,18 +66,18 @@ class NeonDepthwiseConvFunction : public ConvFunctionBase {
    float* inputPadding = inputData;
    int padInputHeight = inputHeight + 2 * paddingH();
    int padInputWidth = inputWidth + 2 * paddingW();
-    if (paddingH() > 0 || paddingW() > 0) {
-      int newSize = batchSize * inputChannels * padInputHeight * padInputWidth;
-      resizeBuffer<Device>(newSize);
-      inputPadding = reinterpret_cast<float*>(memory_->getBuf());
-      neon::Padding<float>::run(inputData,
-                                inputPadding,
-                                batchSize * inputChannels,
-                                inputHeight,
-                                inputWidth,
-                                padInputHeight,
-                                padInputWidth);
-    }
+    int newSize =
+        batchSize * (inputChannels + 1) * padInputHeight * padInputWidth;
+    resizeBuffer<Device>(newSize);
+    inputPadding = reinterpret_cast<float*>(memory_->getBuf());
+    neon::Padding<float>::run(inputData,
+                              inputPadding,
+                              batchSize * inputChannels,
+                              inputHeight,
+                              inputWidth,
+                              padInputHeight,
+                              padInputWidth);
    std::function<void(
        const float*, const float*, int, int, int, int, int, int, float*)>