auc_op.cc 3.7 KB
Newer Older
T
typhoonzero 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19
/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserve.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License. */

#include "paddle/operators/auc_op.h"

namespace paddle {
namespace operators {

T
update  
typhoonzero 已提交
20
class AucOp : public framework::OperatorWithKernel {
T
typhoonzero 已提交
21 22 23 24
 public:
  using framework::OperatorWithKernel::OperatorWithKernel;

 protected:
武毅 已提交
25
  void InferShape(framework::InferShapeContext *ctx) const override {
26
    PADDLE_ENFORCE(ctx->HasInput("Out"), "Input of Out should not be null.");
武毅 已提交
27
    PADDLE_ENFORCE(ctx->HasInput("Indices"),
28
                   "Input of Indices should not be null.");
T
typhoonzero 已提交
29
    PADDLE_ENFORCE(ctx->HasInput("Label"),
30
                   "Input of Label should not be null.");
武毅 已提交
31 32
    auto inference_height = ctx->GetInputDim("Out")[0];
    auto label_height = ctx->GetInputDim("Label")[0];
T
typhoonzero 已提交
33

武毅 已提交
34 35
    PADDLE_ENFORCE_EQ(inference_height, label_height,
                      "Out and Label should have same height.");
T
typhoonzero 已提交
36

T
typhoonzero 已提交
37
    ctx->SetOutputDim("AUC", {1});
武毅 已提交
38 39 40 41
    ctx->ShareLoD("Out", /*->*/ "AUC");
  }

 protected:
Y
Yu Yang 已提交
42
  framework::OpKernelType GetKernelType(
武毅 已提交
43
      const framework::ExecutionContext &ctx) const override {
Y
Yu Yang 已提交
44 45 46
    return framework::OpKernelType(
        framework::ToDataType(ctx.Input<Tensor>("Out")->type()),
        ctx.device_context());
T
typhoonzero 已提交
47 48 49 50 51 52 53
  }
};

class AucOpMaker : public framework::OpProtoAndCheckerMaker {
 public:
  AucOpMaker(framework::OpProto *proto, framework::OpAttrChecker *op_checker)
      : OpProtoAndCheckerMaker(proto, op_checker) {
武毅 已提交
54 55
    AddInput("Out",
             "A floating point 2D tensor, values are in the range [0, 1]."
56
             "Each row is sorted in descending order. This input should be the"
武毅 已提交
57 58 59 60
             "output of topk."
             "Typically, this tensor indicates the probability of each label");
    AddInput("Indices",
             "An int 2D tensor, indicating the indices of original"
61 62
             "tensor before sorting. Typically, this tensor indicates which "
             "label the probability stands for.");
T
auc_op  
typhoonzero 已提交
63
    AddInput("Label",
武毅 已提交
64 65
             "A 2D int tensor indicating the label of the training data."
             "The height is batch size and width is always 1.");
T
auc_op  
typhoonzero 已提交
66 67
    // TODO(typhoonzero): support weight input
    AddOutput("AUC",
T
typhoonzero 已提交
68
              "A scalar representing the "
69
              "current area-under-the-curve.");
T
typhoonzero 已提交
70

T
typhoonzero 已提交
71
    AddAttr<std::string>("curve", "Curve type, can be 'ROC' or 'PR'.")
T
typhoonzero 已提交
72 73 74 75 76 77
        .SetDefault("ROC");
    AddAttr<int>("num_thresholds",
                 "The number of thresholds to use when discretizing the"
                 " roc curve.")
        .SetDefault(200);

78 79
    AddComment(R"DOC(
Area Under The Curve (AUC) Operator.
武毅 已提交
80

81 82
This implementation computes the AUC according to forward output and label.
It is used very widely in binary classification evaluation. As a note:
武毅 已提交
83
If input label contains values other than 0 and 1, it will be cast
84
to bool. You can find the relevant definitions here:
武毅 已提交
85 86
https://en.wikipedia.org/wiki/Receiver_operating_characteristic#Area_under_the_curve

87 88 89
There are two types of possible curves:
1. ROC: Receiver operating characteristic
2. PR: Precision Recall
武毅 已提交
90
)DOC");
T
typhoonzero 已提交
91 92 93 94 95 96 97
  }
};

}  // namespace operators
}  // namespace paddle

namespace ops = paddle::operators;
T
update  
typhoonzero 已提交
98
REGISTER_OP_WITHOUT_GRADIENT(auc, ops::AucOp, ops::AucOpMaker);
T
typhoonzero 已提交
99
REGISTER_OP_CPU_KERNEL(auc, ops::AucKernel<paddle::platform::CPUPlace, float>);