detection_output_op.cc 4.0 KB
Newer Older
S
sweetsky0901 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23
/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserved.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License. */

#include "paddle/operators/detection_output_op.h"
namespace paddle {
namespace operators {

// Declares the proto (inputs, outputs, attributes and documentation) of the
// detection_output operator.
//
// Inputs:  "Loc", "Conf", "PriorBox"
// Outputs: "Out"
// Attrs:   background_label_id, num_classes, nms_threshold,
//          confidence_threshold, top_k, nms_top_k
//
// Note: adjacent string literals are concatenated by the compiler with no
// separator, so every fragment below that continues a sentence ends with an
// explicit space.
class Detection_output_OpMaker : public framework::OpProtoAndCheckerMaker {
 public:
  Detection_output_OpMaker(framework::OpProto* proto,
                           framework::OpAttrChecker* op_checker)
      : OpProtoAndCheckerMaker(proto, op_checker) {
    // ---- Inputs ----
    AddInput("Loc",
             "(Tensor) The input tensor of detection_output operator. "
             "The input predict locations. "
             "The format of input tensor is kNCHW. Where K is priorbox point "
             "numbers, "
             "N is How many boxes are there on each point, "
             "C is 4, H and W both are 1.");
    AddInput("Conf",
             "(Tensor) The input tensor of detection_output operator. "
             "The input priorbox confidence. "
             "The format of input tensor is kNCHW. Where K is priorbox point "
             "numbers, "
             "N is How many boxes are there on each point, "
             "C is the number of classes, H and W both are 1.");
    AddInput("PriorBox",
             "(Tensor) The input tensor of detection_output operator. "
             "The format of input tensor is the position and variance "
             "of the boxes");

    // ---- Outputs ----
    AddOutput("Out",
              "(Tensor) The output tensor of detection_output operator.");

    // ---- Attributes (none of them declares a default value here) ----
    AddAttr<int>("background_label_id", "(int), The background class index.");
    AddAttr<int>("num_classes", "(int), The number of the classification.");
    AddAttr<float>("nms_threshold",
                   "(float), The Non-maximum suppression threshold.");
    AddAttr<float>("confidence_threshold",
                   "(float), The classification confidence threshold.");
    AddAttr<int>("top_k", "(int), The bbox number kept of the layer's output.");
    AddAttr<int>("nms_top_k",
                 "(int), The bbox number kept of the NMS's output.");

    // ---- Operator-level documentation ----
    AddComment(R"DOC(
          detection output for SSD(single shot multibox detector)
          Apply the NMS to the output of network and compute the predict
          bounding box location. The output's shape of this layer could
          be zero if there is no valid bounding box.
        )DOC");
  }
};

// Operator class for detection_output. It only provides shape inference; the
// computation is done by the kernels registered for this operator.
class Detection_output_Op : public framework::OperatorWithKernel {
 public:
  using framework::OperatorWithKernel::OperatorWithKernel;

  // Verifies that the "Loc", "Conf" and "PriorBox" inputs and the "Out"
  // output are present, then sets the dimensions of "Out" to [1, 7].
  //
  // Each enforce message names the input that is actually being checked, and
  // is written as one sentence so that literal concatenation cannot drop the
  // space between words.
  void InferShape(framework::InferShapeContext* ctx) const override {
    PADDLE_ENFORCE(ctx->HasInput("Loc"),
                   "Input(Loc) of Detection_output_Op should not be null.");
    PADDLE_ENFORCE(ctx->HasInput("Conf"),
                   "Input(Conf) of Detection_output_Op should not be null.");
    PADDLE_ENFORCE(
        ctx->HasInput("PriorBox"),
        "Input(PriorBox) of Detection_output_Op should not be null.");
    PADDLE_ENFORCE(ctx->HasOutput("Out"),
                   "Output(Out) of Detection_output_Op should not be null.");

    // NOTE(review): the shape is hard-coded to [1, 7] regardless of the
    // inputs; presumably the kernel resizes "Out" at run time -- confirm.
    const std::vector<int64_t> output_shape{1, 7};
    ctx->SetOutputDim("Out", framework::make_ddim(output_shape));
  }
};
}  // namespace operators
}  // namespace paddle

// Short alias used by the registration macros below.
namespace ops = paddle::operators;
// Register the detection_output operator together with its proto maker.
// The macro name indicates that no gradient operator is registered.
REGISTER_OP_WITHOUT_GRADIENT(detection_output, ops::Detection_output_Op,
                             ops::Detection_output_OpMaker);
// Register the CPU kernels for detection_output, instantiated for float and
// double.
REGISTER_OP_CPU_KERNEL(
    detection_output,
    ops::Detection_output_Kernel<paddle::platform::CPUPlace, float>,
    ops::Detection_output_Kernel<paddle::platform::CPUPlace, double>);