/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserved.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License. */

#include "paddle/fluid/operators/auc_op.h"
#include <string>

namespace paddle {
namespace operators {

class AucOp : public framework::OperatorWithKernel {
T
typhoonzero 已提交
22 23 24 25
 public:
  using framework::OperatorWithKernel::OperatorWithKernel;

 protected:
武毅 已提交
26
  void InferShape(framework::InferShapeContext *ctx) const override {
27
    PADDLE_ENFORCE(ctx->HasInput("Out"), "Input of Out should not be null.");
武毅 已提交
28
    PADDLE_ENFORCE(ctx->HasInput("Indices"),
29
                   "Input of Indices should not be null.");
T
typhoonzero 已提交
30
    PADDLE_ENFORCE(ctx->HasInput("Label"),
31
                   "Input of Label should not be null.");
武毅 已提交
32 33
    auto inference_height = ctx->GetInputDim("Out")[0];
    auto label_height = ctx->GetInputDim("Label")[0];
T
typhoonzero 已提交
34

武毅 已提交
35 36
    PADDLE_ENFORCE_EQ(inference_height, label_height,
                      "Out and Label should have same height.");
T
typhoonzero 已提交
37

T
typhoonzero 已提交
38
    ctx->SetOutputDim("AUC", {1});
武毅 已提交
39 40 41 42
    ctx->ShareLoD("Out", /*->*/ "AUC");
  }

 protected:
43
  framework::OpKernelType GetExpectedKernelType(
武毅 已提交
44
      const framework::ExecutionContext &ctx) const override {
Y
Yu Yang 已提交
45 46 47
    return framework::OpKernelType(
        framework::ToDataType(ctx.Input<Tensor>("Out")->type()),
        ctx.device_context());
T
typhoonzero 已提交
48 49 50 51 52
  }
};

/**
 * Proto/attribute maker for the `auc` operator.
 *
 * Declares the inputs ("Out", "Indices", "Label"), the output ("AUC"), the
 * attributes ("curve", "num_thresholds") and the user-facing operator
 * documentation.
 */
class AucOpMaker : public framework::OpProtoAndCheckerMaker {
 public:
  AucOpMaker(OpProto *proto, OpAttrChecker *op_checker)
      : OpProtoAndCheckerMaker(proto, op_checker) {
    // NOTE: adjacent string literals are concatenated verbatim, so every
    // fragment that is followed by another one must end with a space.
    AddInput("Out",
             "A floating point 2D tensor, values are in the range [0, 1]. "
             "Each row is sorted in descending order. This input should be the "
             "output of topk. "
             "Typically, this tensor indicates the probability of each label");
    AddInput("Indices",
             "An int 2D tensor, indicating the indices of original "
             "tensor before sorting. Typically, this tensor indicates which "
             "label the probability stands for.");
    AddInput("Label",
             "A 2D int tensor indicating the label of the training data. "
             "The height is batch size and width is always 1.");
    // TODO(typhoonzero): support weight input
    AddOutput("AUC",
              "A scalar representing the "
              "current area-under-the-curve.");

    AddAttr<std::string>("curve", "Curve type, can be 'ROC' or 'PR'.")
        .SetDefault("ROC");
    AddAttr<int>("num_thresholds",
                 "The number of thresholds to use when discretizing the"
                 " roc curve.")
        .SetDefault(200);

    AddComment(R"DOC(
Area Under The Curve (AUC) Operator.

This implementation computes the AUC according to forward output and label.
It is used very widely in binary classification evaluation. As a note:
If input label contains values other than 0 and 1, it will be cast
to bool. You can find the relevant definitions here:
https://en.wikipedia.org/wiki/Receiver_operating_characteristic#Area_under_the_curve

There are two types of possible curves:
1. ROC: Receiver operating characteristic
2. PR: Precision Recall
)DOC");
  }
};

}  // namespace operators
}  // namespace paddle

namespace ops = paddle::operators;
T
update  
typhoonzero 已提交
99
REGISTER_OP_WITHOUT_GRADIENT(auc, ops::AucOp, ops::AucOpMaker);
T
typhoonzero 已提交
100
REGISTER_OP_CPU_KERNEL(auc, ops::AucKernel<paddle::platform::CPUPlace, float>);