modify format, and modify the layer grad test, op test

1f516fa0 · xzl · 81998868 · 1f516fa0 · 1f516fa0 · 1f516fa0
3 changed file
--- a/paddle/function/ConvOpTest.cpp
+++ b/paddle/function/ConvOpTest.cpp
@@ -25,40 +25,32 @@ enum TestType {
  kBackwardFilterTest = 2,
 };
-enum LayerType {
-  convolutionType = 0,
-  depthwiseConvolutionType = 1,
-};
 template <DeviceType DType1, DeviceType DType2>
 class ConvolutionTest {
 public:
  ConvolutionTest(const std::string& conv1,
                  const std::string& conv2,
-                  LayerType layerType,
                  TestType type,
+                  bool useGroups = true,
                  std::string algo = "auto") {
    for (size_t batchSize : {1, 32}) {
      for (size_t inputSize : {7, 14, 54}) {
        for (size_t filterSize : {1, 3, 5}) {
          for (size_t inputChannels : {3, 64}) {
            for (size_t outputChannels : {3, 64, 128}) {
+              for (size_t groups : {1, 3, 64}) {
                if (inputChannels > outputChannels) break;
-              if (layerType == depthwiseConvolutionType &&
+                if (groups != 1 &&
-                  outputChannels % inputChannels != 0)
+                    (inputChannels != groups || outputChannels % groups != 0))
-                break;
+                  continue;
+                if (!useGroups) groups = 1;
-              size_t groups = 1;
-              if (layerType == depthwiseConvolutionType) {
-                groups = inputChannels;
-              }
                for (size_t stride : {1, 2}) {
                  for (size_t padding : {0, 1}) {
                    if (padding >= filterSize) break;
                    size_t outputSize =
-                      (inputSize - filterSize + 2 * padding + stride) / stride;
+                        (inputSize - filterSize + 2 * padding + stride) /
+                        stride;
                    VLOG(3) << " batchSize=" << batchSize
                            << " inputChannels=" << inputChannels
                            << " inputHeight=" << inputSize
@@ -85,10 +77,10 @@ public:
                        batchSize, inputChannels, inputSize, inputSize};
                    TensorShape filter;
-                  if (layerType == depthwiseConvolutionType)
+                    if (groups > 1)
                      filter = TensorShape({groups,
                                            outputChannels / groups,
-                                          (size_t)1,
+                                            inputChannels / groups,
                                            filterSize,
                                            filterSize});
                    else
@@ -107,7 +99,8 @@ public:
                    } else if (type == kBackwardInputTest) {
                      test.addInputs(BufferArg(VALUE_TYPE_FLOAT, output));
                      test.addInputs(BufferArg(VALUE_TYPE_FLOAT, filter));
-                    test.addOutputs(BufferArg(VALUE_TYPE_FLOAT, input), ADD_TO);
+                      test.addOutputs(BufferArg(VALUE_TYPE_FLOAT, input),
+                                      ADD_TO);
                      test.run();
                    } else if (type == kBackwardFilterTest) {
                      test.addInputs(BufferArg(VALUE_TYPE_FLOAT, output));
@@ -123,6 +116,7 @@ public:
        }
      }
    }
+  }
 };
 // Mainly used to test cases where the height and width (input, filter)
@@ -132,8 +126,8 @@ class ConvolutionTest2 {
 public:
  ConvolutionTest2(const std::string& conv1,
                   const std::string& conv2,
-                   LayerType layerType,
                   TestType type,
+                   bool useGroups = true,
                   std::string algo = "auto") {
    for (size_t batchSize : {16}) {
      for (size_t inputHeight : {7, 31}) {
@@ -142,15 +136,13 @@ public:
            for (size_t filterWidth : {3, 7}) {
              for (size_t inputChannels : {7}) {
                for (size_t outputChannels : {7, 32}) {
-                  if (layerType == depthwiseConvolutionType &&
+                  for (size_t groups : {1, 7}) {
-                      outputChannels % inputChannels != 0)
+                    if (!useGroups && groups != 1 &&
-                    break;
+                        (inputChannels != groups ||
+                         outputChannels % groups != 0))
+                      continue;
+                    if (!useGroups) groups = 1;
-                  size_t groups = 1;
-                  if (layerType == depthwiseConvolutionType) {
-                    groups = inputChannels;
-                  }
                    size_t stride = 1;
                    size_t padding = 0;
                    size_t outputHeight =
@@ -185,10 +177,10 @@ public:
                        batchSize, inputChannels, inputHeight, inputWidth};
                    TensorShape filter;
-                  if (layerType == depthwiseConvolutionType)
+                    if (groups > 1)
                      filter = TensorShape({groups,
                                            outputChannels / groups,
-                                          (size_t)1,
+                                            inputChannels / groups,
                                            filterHeight,
                                            filterWidth});
                    else
@@ -207,7 +199,8 @@ public:
                    } else if (type == kBackwardInputTest) {
                      test.addInputs(BufferArg(VALUE_TYPE_FLOAT, output));
                      test.addInputs(BufferArg(VALUE_TYPE_FLOAT, filter));
-                    test.addOutputs(BufferArg(VALUE_TYPE_FLOAT, input), ADD_TO);
+                      test.addOutputs(BufferArg(VALUE_TYPE_FLOAT, input),
+                                      ADD_TO);
                      test.run();
                    } else if (type == kBackwardFilterTest) {
                      test.addInputs(BufferArg(VALUE_TYPE_FLOAT, output));
@@ -223,109 +216,37 @@ public:
        }
      }
    }
+  }
 };
-// ======Start Convolution TEST======
 TEST(Forward, GEMM) {
  ConvolutionTest<DEVICE_TYPE_CPU, DEVICE_TYPE_CPU> test(
-      "NaiveConv-CPU", "GemmConv-CPU", convolutionType, kForwardTest);
+      "NaiveConv-CPU", "GemmConv-CPU", kForwardTest, false);
  ConvolutionTest2<DEVICE_TYPE_CPU, DEVICE_TYPE_CPU> test2(
-      "NaiveConv-CPU", "GemmConv-CPU", convolutionType, kForwardTest);
+      "NaiveConv-CPU", "GemmConv-CPU", kForwardTest, false);
 }
 #ifndef PADDLE_ONLY_CPU
 TEST(Forward, GEMM2) {
  ConvolutionTest<DEVICE_TYPE_CPU, DEVICE_TYPE_GPU> test(
-      "GemmConv-CPU", "GemmConv-GPU", convolutionType, kForwardTest);
+      "GemmConv-CPU", "GemmConv-GPU", kForwardTest);
  ConvolutionTest2<DEVICE_TYPE_CPU, DEVICE_TYPE_GPU> test2(
-      "GemmConv-CPU", "GemmConv-GPU", convolutionType, kForwardTest);
+      "GemmConv-CPU", "GemmConv-GPU", kForwardTest);
 }
 TEST(BackwardInput, GEMM) {
  ConvolutionTest<DEVICE_TYPE_CPU, DEVICE_TYPE_GPU> test(
-      "GemmConvGradInput-CPU",
+      "GemmConvGradInput-CPU", "GemmConvGradInput-GPU", kBackwardInputTest);
-      "GemmConvGradInput-GPU",
-      convolutionType,
-      kBackwardInputTest);
  ConvolutionTest2<DEVICE_TYPE_CPU, DEVICE_TYPE_GPU> test2(
-      "GemmConvGradInput-CPU",
+      "GemmConvGradInput-CPU", "GemmConvGradInput-GPU", kBackwardInputTest);
-      "GemmConvGradInput-GPU",
-      convolutionType,
-      kBackwardInputTest);
 }
 TEST(BackwardFilter, GEMM) {
  ConvolutionTest<DEVICE_TYPE_CPU, DEVICE_TYPE_GPU> test(
-      "GemmConvGradFilter-CPU",
+      "GemmConvGradFilter-CPU", "GemmConvGradFilter-GPU", kBackwardFilterTest);
-      "GemmConvGradFilter-GPU",
-      convolutionType,
-      kBackwardFilterTest);
-  ConvolutionTest2<DEVICE_TYPE_CPU, DEVICE_TYPE_GPU> test2(
-      "GemmConvGradFilter-CPU",
-      "GemmConvGradFilter-GPU",
-      convolutionType,
-      kBackwardFilterTest);
-}
-#endif
-// ======End Convolution TEST======
-// ======Start DepthwiseConvolution TEST======
-// TODO(zhaolong) The depthwise convolution cpu test will be added when the cpu
-// version of depthwiseConv is implemented.
-#ifndef PADDLE_ONLY_CPU
-TEST(DepthwiseConvForward, GEMM) {
-  ConvolutionTest<DEVICE_TYPE_GPU, DEVICE_TYPE_GPU> test(
-      "GemmConv-GPU",
-      "DepthwiseConv-GPU",
-      depthwiseConvolutionType,
-      kForwardTest);
-  ConvolutionTest2<DEVICE_TYPE_CPU, DEVICE_TYPE_GPU> test2(
-      "GemmConv-GPU",
-      "DepthwiseConv-GPU",
-      depthwiseConvolutionType,
-      kForwardTest);
-}
-TEST(DepthwiseConvForward, GEMM2) {
-  ConvolutionTest<DEVICE_TYPE_GPU, DEVICE_TYPE_GPU> test(
-      "DepthwiseConv-GPU",
-      "DepthwiseConv-GPU",
-      depthwiseConvolutionType,
-      kForwardTest);
-  ConvolutionTest2<DEVICE_TYPE_CPU, DEVICE_TYPE_GPU> test2(
-      "DepthwiseConv-GPU",
-      "DepthwiseConv-GPU",
-      depthwiseConvolutionType,
-      kForwardTest);
-}
-TEST(DepthwiseConvBackwardInput, GEMM) {
-  ConvolutionTest<DEVICE_TYPE_CPU, DEVICE_TYPE_GPU> test(
-      "DepthwiseConvGradInput-GPU",
-      "DepthwiseConvGradInput-GPU",
-      depthwiseConvolutionType,
-      kBackwardInputTest);
-  ConvolutionTest2<DEVICE_TYPE_CPU, DEVICE_TYPE_GPU> test2(
-      "DepthwiseConvGradInput-GPU",
-      "DepthwiseConvGradInput-GPU",
-      depthwiseConvolutionType,
-      kBackwardInputTest);
-}
-TEST(DepthwiseConvBackwardFilter, GEMM) {
-  ConvolutionTest<DEVICE_TYPE_CPU, DEVICE_TYPE_GPU> test(
-      "DepthwiseConvGradFilter-GPU",
-      "DepthwiseConvGradFilter-GPU",
-      depthwiseConvolutionType,
-      kBackwardFilterTest);
  ConvolutionTest2<DEVICE_TYPE_CPU, DEVICE_TYPE_GPU> test2(
-      "DepthwiseConvGradFilter-GPU",
+      "GemmConvGradFilter-CPU", "GemmConvGradFilter-GPU", kBackwardFilterTest);
-      "DepthwiseConvGradFilter-GPU",
-      depthwiseConvolutionType,
-      kBackwardFilterTest);
 }
 #endif
-// ======End DepthwiseConvolution TEST======
 }  // namespace paddle
--- a/paddle/gserver/layers/ExpandConvLayer.cpp
+++ b/paddle/gserver/layers/ExpandConvLayer.cpp
@@ -39,21 +39,22 @@ bool ExpandConvLayer::init(const LayerMap &layerMap,
  filterShape_.resize(numInputs);
  outputShape_.resize(numInputs);
-  string convType;
+  std::string convType;
-  string convGradInputType;
+  std::string convGradInputType;
-  string convGradFilterType;
+  std::string convGradFilterType;
  for (int i = 0; i < config_.inputs_size(); i++) {
    std::vector<size_t> paddings = {(size_t)paddingY_[i], (size_t)padding_[i]};
    std::vector<size_t> strides = {(size_t)strideY_[i], (size_t)stride_[i]};
    if (useGpu_ && (size_t)groups_[i] == (size_t)channels_[i] && !isDeconv_) {
-      convType = "DepthwiseConv" convGradInputType =
+      convType = "DepthwiseConv";
-          "DepthwiseConvGradInput" convGradFilterType =
+      convGradInputType = "DepthwiseConvGradInput";
-              "DepthwiseConvGradFilter"
+      convGradFilterType = "DepthwiseConvGradFilter";
    } else {
-      convType = "GemmConv" convGradInputType =
+      convType = "GemmConv";
-          "GemmConvGradInput" convGradFilterType = "GemmConvGradFilter"
+      convGradInputType = "GemmConvGradInput";
+      convGradFilterType = "GemmConvGradFilter";
    }
    if (FLAGS_use_nnpack) {

--- a/paddle/gserver/tests/test_LayerGrad.cpp
+++ b/paddle/gserver/tests/test_LayerGrad.cpp
@@ -349,13 +349,13 @@ TEST(Layer, CosSimVecMatLayer) {
 void testDepthwiseConvLayer(const string& type, bool useGpu) {
  TestConfig config;
-  config.biasSize = 16;
+  config.biasSize = 32;
  config.layerConfig.set_type(type);
-  config.layerConfig.set_num_filters(16);
+  config.layerConfig.set_num_filters(32);
  config.layerConfig.set_partial_sum(1);
  config.layerConfig.set_shared_biases(true);
-  config.inputDefs.push_back({INPUT_DATA, "layer_0", 2048, 192 / 2});
+  config.inputDefs.push_back({INPUT_DATA, "layer_0", 2048, 192});
  LayerInputConfig* input = config.layerConfig.add_inputs();
  ConvConfig* conv = input->mutable_conv_conf();
  conv->set_filter_size(2);
@@ -388,8 +388,11 @@ void testDepthwiseConvLayer(const string& type, bool useGpu) {
 }
 TEST(Layer, depthwiseConvLayer) {
+  //  'depthwise_conv' is a sepecial case of 'exconv' whose
+  //  groups size equals to the input channels size.
+  testDepthwiseConvLayer("exconv", /* useGpu= */ false);
 #ifndef PADDLE_ONLY_CPU
-  testDepthwiseConvLayer("depthwise_conv", /* useGpu= */ true);
+  testDepthwiseConvLayer("exconv", /* useGpu= */ true);
 #endif
 }