/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserved.
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 *     Unless required by applicable law or agreed to in writing, software
 *     distributed under the License is distributed on an "AS IS" BASIS,
 *     WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 *     See the License for the specific language governing permissions and
 *     limitations under the License. */

#include "paddle/fluid/operators/quantize_op.h"
#include "paddle/fluid/framework/op_version_registry.h"
#ifdef PADDLE_WITH_MKLDNN
#include "paddle/fluid/platform/mkldnn_helper.h"
#endif

namespace paddle {
namespace operators {

// Chooses the kernel type for the quantize operator.
//
// The returned kernel type is assembled from:
//   * the data type of the variable bound to "Input",
//   * the place reported by the execution context,
//   * the MKLDNN data layout and the MKLDNN library type, which are used
//     unconditionally (no other layout/library is ever selected here).
framework::OpKernelType QuantOp::GetExpectedKernelType(
    const framework::ExecutionContext& ctx) const {
  const framework::LibraryType library = framework::LibraryType::kMKLDNN;
  const framework::DataLayout layout = framework::DataLayout::kMKLDNN;

  return framework::OpKernelType(
      OperatorWithKernel::IndicateVarDataType(ctx, "Input"), ctx.GetPlace(),
      layout, library);
}

void QuantOpMaker::Make() {
35 36
  AddInput("Input", "Input data");
  AddOutput("Output", "Output data");
X
xiaoli.liu@intel.com 已提交
37 38 39
  AddAttr<bool>("is_negative_input",
                "(bool, default false) Only used in mkldnn INT8 kernel")
      .SetDefault(false);
40 41 42 43 44
  AddAttr<float>("Scale", "Scale data").SetDefault({1.0f});
  AddAttr<float>(
      "Shift",
      "Shift data. When Shift is non-zero, data is quantized to unsigned int8.")
      .SetDefault({0.0f});
45 46 47
  AddAttr<std::string>("output_format",
                       "Convert format to NHWC or NCHW during quantization.")
      .SetDefault("NHWC");
48 49
  AddAttr<bool>("bfloat16", "(bool, default false) Convert to bfloat16")
      .SetDefault(false);
X
xiaoli.liu@intel.com 已提交
50 51 52 53 54 55 56
  AddComment(R"DOC(This op will quantize data from FP32 to INT8)DOC");
}

}  // namespace operators
}  // namespace paddle
namespace ops = paddle::operators;

57
REGISTER_OPERATOR(quantize, ops::QuantOp, ops::QuantOpMaker);
58 59 60 61 62 63 64

REGISTER_OP_VERSION(quantize)
    .AddCheckpoint(
        R"ROC( Add a new attribute [bfloat16])ROC",
        paddle::framework::compatible::OpVersionDesc().NewAttr(
            "bfloat16", "If true, float32 input is converted to bfloat16",
            false));