Fix CrossMapNormalGradFunc

a9228e2a · hedaoyuan · c4437fa2 · a9228e2a · a9228e2a
隐藏空白更改
内联并排

Showing 2 changed files with 43 additions and 21 deletions

paddle/function/CrossMapNormalOp.cpp paddle/function/CrossMapNormalOp.cpp +39 -20

paddle/function/Function.h paddle/function/Function.h +4 -1

未找到文件。
--- a/paddle/function/CrossMapNormalOp.cpp
+++ b/paddle/function/CrossMapNormalOp.cpp
@@ -196,8 +196,8 @@ public:
  }
  void check(const BufferArgs& inputs, const BufferArgs& outputs) override {
-    CHECK_EQ((size_t)numInputs_, inputs.size());
+    CHECK_EQ(numInputs_, inputs.size());
-    CHECK_EQ((size_t)numOutputs_, outputs.size());
+    CHECK_EQ(numOutputs_, outputs.size());
    CHECK_EQ(inputs[0].shape().ndims(), (size_t)4);
    CHECK(inputs[0].shape() == outputs[0].shape());
@@ -215,7 +215,7 @@ public:
    // number of floating-point operations
    // an approximate value
-    size_t ops = batchSize * maps * ((rows * columns) * size_);
+    size_t ops = batchSize * maps * rows * columns * (size_ * 2 + 3);
    return ops;
  }
@@ -273,15 +273,7 @@ public:
  }
  void calc(const BufferArgs& inputs, const BufferArgs& outputs) override {
-    CHECK_EQ((size_t)numInputs_, inputs.size());
+    check(inputs, outputs);
-    CHECK_EQ((size_t)numOutputs_, outputs.size());
-    CHECK_EQ(inputs[0].shape().ndims(), (size_t)4);
-    CHECK(inputs[0].shape() == inputs[1].shape());
-    CHECK(inputs[0].shape() == inputs[2].shape());
-    CHECK(inputs[0].shape() == inputs[3].shape());
-    CHECK(inputs[0].shape() == outputs[0].shape());
    if (outputs[0].getArgType() != ADD_TO) {
      // Currently, some algorithm implementations are ASSIGN_TO mode,
      // if need to support the ADD_TO calculation, need to clear the output.
@@ -290,25 +282,52 @@ public:
      tmp.zero();
    }
-    size_t samples = inputs[0].shape()[0];
+    size_t batchSize = inputs[0].shape()[0];
-    size_t channels = inputs[0].shape()[1];
+    size_t maps = inputs[0].shape()[1];
-    size_t height = inputs[0].shape()[2];
+    size_t rows = inputs[0].shape()[2];
-    size_t width = inputs[0].shape()[3];
+    size_t columns = inputs[0].shape()[3];
    CrossMapNormalGrad<Device>(outputs[0].data<real>(),
                               inputs[0].data<real>(),
                               inputs[1].data<real>(),
                               inputs[2].data<real>(),
                               inputs[3].data<real>(),
-                               samples,
+                               batchSize,
-                               channels,
+                               maps,
-                               height,
+                               rows,
-                               width,
+                               columns,
                               size_,
                               scale_,
                               pow_);
  }
+  void check(const BufferArgs& inputs, const BufferArgs& outputs) override {
+    CHECK_EQ(numInputs_, inputs.size());
+    CHECK_EQ(numOutputs_, outputs.size());
+    CHECK_EQ(inputs[0].shape().ndims(), (size_t)4);
+    CHECK(inputs[0].shape() == inputs[1].shape());
+    CHECK(inputs[0].shape() == inputs[2].shape());
+    CHECK(inputs[0].shape() == inputs[3].shape());
+    CHECK(inputs[0].shape() == outputs[0].shape());
+  }
+  // Only the shape of one input is needed to calculate the number of
+  // floating-point operations.
+  size_t ops(const BufferArgs& inputs, const BufferArgs& outputs) override {
+    CHECK_LT((size_t)1, inputs.size());
+    size_t batchSize = inputs[0].shape()[0];
+    size_t maps = inputs[0].shape()[1];
+    size_t rows = inputs[0].shape()[2];
+    size_t columns = inputs[0].shape()[3];
+    // number of floating-point operations
+    // an approximate value
+    size_t ops = batchSize * maps * rows * columns * (size_ * 4 + 2);
+    return ops;
+  }
 private:
  size_t size_;
  real scale_;

--- a/paddle/function/Function.h
+++ b/paddle/function/Function.h
@@ -156,12 +156,15 @@ public:
  // This member function is used to check whether the BufferType and shape of
  // the inputs and outputs arguments of the Function are correct.
  // General calc function which will call this check to do arguments check.
-  // Also before the call calc, the caller can also check their own arguments.
+  // Before calc is called, the caller can also check its own arguments.
  virtual void check(const BufferArgs& inputs, const BufferArgs& outputs) {}
  // Calculate the number of floating-point operations of this Function.
  // The inputs and outputs arguments do not need to contain the actual data,
  // only the shape.
+  // Some Functions have the same input and output shapes,
+  // so you may not need to pass the complete set of arguments.
+  // Passing the full set of arguments is always correct for this interface.
  virtual size_t ops(const BufferArgs& inputs, const BufferArgs& outputs) {
    return 0;
  }