improve doc in margin_rank_loss_op

13b7d928 · Yibing Liu · 240adef1 · 13b7d928 · 13b7d928
显示空白变更内容
内联并排

Showing with 21 addition and 15 deletion

paddle/operators/margin_rank_loss_op.cc paddle/operators/margin_rank_loss_op.cc +19 -13

paddle/operators/margin_rank_loss_op.h paddle/operators/margin_rank_loss_op.h +2 -2

未找到文件。
--- a/paddle/operators/margin_rank_loss_op.cc
+++ b/paddle/operators/margin_rank_loss_op.cc
@@ -22,7 +22,7 @@ class MarginRankLossOp : public framework::OperatorWithKernel {
  using framework::OperatorWithKernel::OperatorWithKernel;
 protected:
-  void InferShape(framework::InferShapeContextBase *ctx) const override {
+  void InferShape(framework::InferShapeContext *ctx) const override {
    // input check
    PADDLE_ENFORCE(ctx->HasInput("Label"), "Input(Label) shouldn't be null.");
    PADDLE_ENFORCE(ctx->HasInput("X1"), "Input(X1) shouldn't be null.");
@@ -47,11 +47,11 @@ class MarginRankLossOpMaker : public framework::OpProtoAndCheckerMaker {
                        framework::OpAttrChecker *op_checker)
      : OpProtoAndCheckerMaker(proto, op_checker) {
    AddInput("X1",
-             "(2-D tensor with shape [batch_size x 1]) In pairwise ranking, "
+             "(2-D tensor with shape [batch_size x 1]) The score for "
-             "X1 is the score for one item to be ranked.");
+             "one item X1 to be ranked, from pairwise ranking model.");
    AddInput("X2",
-             "(2-D tensor with shape [batch_size x 1]) In pairwise ranking, "
+             "(2-D tensor with shape [batch_size x 1]) The score for "
-             "X2 is the score for another item to be ranked.");
+             "another item X2 to be ranked, from pairwise ranking model.");
    AddInput("Label",
             "(2-D tensor with shape [batch_size x 1]) "
             "The label indicating X1 ranked higher than X2 or not, "
@@ -63,19 +63,25 @@ class MarginRankLossOpMaker : public framework::OpProtoAndCheckerMaker {
              "to indicate whether each element of Output(Out) is activated.")
        .AsIntermediate();
    AddOutput("Out",
-              "(2-D tensor with shape [batch_size x 1])"
+              "(2-D tensor with shape [batch_size x 1]) "
              "The output loss of MarginRankLoss operator.");
    AddComment(R"DOC(
-MarginRankLoss operator measures the loss given a pair of input {`X1`, `X2`}
+MarginRankLoss operator measures the loss given a pair of training sample
-and the `Label` with attribute `margin`, where `Label = +1` indicating X1 is
+{`X1`, `X2`} and the `Label` with attribute `margin`, where `Label = +1` 
-ranked higher than `X2`, otherwise `Label = -1`. The loss turns out
+indicating X1 is ranked higher than `X2`, otherwise `Label = -1`. The loss 
+turns out
-loss(X1, X2, Label) = max(0, -Label * (X1 - X2) + margin)
+loss(X1, X2, Label) = max(0, -Label * (X1 - X2) + margin).
 The attribute `margin` involved here helps make the predictions more robust.
-Only when the difference between `X1` and `X2` is greater than `margin`, it is
+Denote the item ranked higher as the positive sample, otherwise negative 
-possible for these two items contribute to the final loss.
+sample. If the score of the two samples statisfies 
+positive sample - negative sample < margin,
+the pair of samples will contribute to the loss, which will backpropogate and 
+train the ranking model to enlarge the difference of the two score.
 For batch input with size `batch_size`, `X1`, `X2` and `Label`
 all have the same shape [batch_size x 1].
@@ -89,7 +95,7 @@ class MarginRankLossGradOp : public framework::OperatorWithKernel {
  using framework::OperatorWithKernel::OperatorWithKernel;
 protected:
-  void InferShape(framework::InferShapeContextBase *ctx) const override {
+  void InferShape(framework::InferShapeContext *ctx) const override {
    PADDLE_ENFORCE(ctx->HasInput("Label"), "Input(Label) shouldn't be null.");
    PADDLE_ENFORCE(ctx->HasInput("X1"), "Input(X1) shouldn't be null.");
    PADDLE_ENFORCE(ctx->HasInput("X2"), "Input(X2) shouldn't be null.");

--- a/paddle/operators/margin_rank_loss_op.h
+++ b/paddle/operators/margin_rank_loss_op.h
@@ -35,7 +35,7 @@ struct Heaviside {
 };
 template <typename Place, typename T>
-class MarginRankLossKernel : public framework::OpKernel {
+class MarginRankLossKernel : public framework::OpKernel<T> {
 public:
  void Compute(const framework::ExecutionContext& ctx) const {
    auto* out_t = ctx.Output<framework::Tensor>("Out");
@@ -63,7 +63,7 @@ class MarginRankLossKernel : public framework::OpKernel {
 };
 template <typename Place, typename T>
-class MarginRankLossGradKernel : public framework::OpKernel {
+class MarginRankLossGradKernel : public framework::OpKernel<T> {
 public:
  void Compute(const framework::ExecutionContext& ctx) const {
    auto* d_x1_t =