From dbc63555f35a7263a37d77c9a736df3787cb75f0 Mon Sep 17 00:00:00 2001
From: wenbin <wang3323032@qq.com>
Date: Thu, 17 Nov 2022 17:24:18 +0800
Subject: [PATCH] support int input for scale (#48044)

* int scale

* round

* revert commit
---
 .../inference/tensorrt/convert/scale_op.cc    |   8 +-
 paddle/fluid/inference/tensorrt/op_teller.cc  |  25 +++-
 .../ir/inference/test_trt_convert_scale.py    | 138 +++++++++++-------
 3 files changed, 106 insertions(+), 65 deletions(-)
diff --git a/paddle/fluid/inference/tensorrt/convert/scale_op.cc b/paddle/fluid/inference/tensorrt/convert/scale_op.cc
index d770c21a9ad..361ed223955 100644
--- a/paddle/fluid/inference/tensorrt/convert/scale_op.cc
+++ b/paddle/fluid/inference/tensorrt/convert/scale_op.cc
@@ -49,9 +49,12 @@ class ScaleOpConverter : public OpConverter {
         PADDLE_GET_CONST(bool, op_desc.GetAttr("bias_after_scale"));
     float bias = PADDLE_GET_CONST(float, op_desc.GetAttr("bias"));
     float scale = PADDLE_GET_CONST(float, op_desc.GetAttr("scale"));
+    bool is_int = input->getType() == nvinfer1::DataType::kINT32;
     nvinfer1::ILayer* layer = nullptr;
     if (engine_->with_dynamic_shape()) {
-      nvinfer1::ITensor* bias_tensor = Add1DConstantLayer(bias);
+      nvinfer1::ITensor* bias_tensor =
+          is_int ? Add1DConstantLayer(static_cast<int>(bias))
+                 : Add1DConstantLayer(bias);
       bool is_bias_0 = (bias < 1e-06 && bias > -1e-06);
 
       std::vector<int32_t> bias_shapes(input->getDimensions().nbDims, 1);
@@ -72,7 +75,8 @@ class ScaleOpConverter : public OpConverter {
         is_scale_1 = false;
       } else {
         has_scale_tensor = false;
-        scale_tensor = Add1DConstantLayer(scale);
+        scale_tensor = is_int ? Add1DConstantLayer(static_cast<int>(scale))
+                              : Add1DConstantLayer(scale);
         is_scale_1 = ((scale - 1.0) < 1e-06 && (scale - 1.0) > -1e-06);
       }
 
diff --git a/paddle/fluid/inference/tensorrt/op_teller.cc b/paddle/fluid/inference/tensorrt/op_teller.cc
index dfe1b2ca623..f27c006f208 100644
--- a/paddle/fluid/inference/tensorrt/op_teller.cc
+++ b/paddle/fluid/inference/tensorrt/op_teller.cc
@@ -1076,13 +1076,24 @@ struct SimpleOpTypeSetTeller : public Teller {
       auto* x_var_desc = block->FindVar(x_var_name);
       const auto x_shape = x_var_desc->GetShape();
       auto dtype = x_var_desc->GetDataType();
-      // At present, only support float32 or float16 into trt.
-      if (!(dtype == 5 || dtype == 4)) {
-        return false;
-      }
-      if (!with_dynamic_shape && x_shape.size() == 1) {
-        VLOG(3) << "Scale op does not support 1-dimensional input in tensorrt";
-        return false;
+      if (!with_dynamic_shape) {
+        // At present, only support float32 or float16 into trt.
+        if (!(dtype == framework::proto::VarType::FP32 ||
+              dtype == framework::proto::VarType::FP16)) {
+          return false;
+        }
+        if (x_shape.size() == 1) {
+          VLOG(3)
+              << "Scale op does not support 1-dimensional input in tensorrt";
+          return false;
+        }
+      } else {
+        // At present, only support float32 or float16 or int32 into trt.
+        if (!(dtype == framework::proto::VarType::FP32 ||
+              dtype == framework::proto::VarType::FP16 ||
+              dtype == framework::proto::VarType::INT32)) {
+          return false;
+        }
       }
     }
 
diff --git a/python/paddle/fluid/tests/unittests/ir/inference/test_trt_convert_scale.py b/python/paddle/fluid/tests/unittests/ir/inference/test_trt_convert_scale.py
index 27658d92863..5e11bec6849 100644
--- a/python/paddle/fluid/tests/unittests/ir/inference/test_trt_convert_scale.py
+++ b/python/paddle/fluid/tests/unittests/ir/inference/test_trt_convert_scale.py
@@ -26,18 +26,24 @@ class TrtConvertScaleTest(TrtLayerAutoScanTest):
         return True
 
     def sample_program_configs(self):
-        def generate_input1(attrs: List[Dict[str, Any]], batch):
+        def generate_input1(attrs: List[Dict[str, Any]], batch, is_int):
             if self.dims == 4:
-                return np.ones([batch, 3, 24, 24]).astype(np.float32)
+                return np.ones([batch, 3, 24, 24]).astype(
+                    np.int32 if is_int else np.float32
+                )
             elif self.dims == 3:
-                return np.ones([batch, 3, 24]).astype(np.float32)
+                return np.ones([batch, 3, 24]).astype(
+                    np.int32 if is_int else np.float32
+                )
             elif self.dims == 2:
-                return np.ones([batch, 24]).astype(np.float32)
+                return np.ones([batch, 24]).astype(
+                    np.int32 if is_int else np.float32
+                )
             elif self.dims == 1:
-                return np.ones([24]).astype(np.float32)
+                return np.ones([24]).astype(np.int32 if is_int else np.float32)
 
-        def generate_weight1(attrs: List[Dict[str, Any]]):
-            return np.ones([1]).astype(np.float32)
+        def generate_weight1(attrs: List[Dict[str, Any]], is_int):
+            return np.ones([1]).astype(np.int32 if is_int else np.float32)
 
         for num_input in [0, 1]:
             for dims in [1, 2, 3, 4]:
@@ -45,58 +51,67 @@ class TrtConvertScaleTest(TrtLayerAutoScanTest):
                     for scale in [0.1, -1.0]:
                         for bias in [0.0, 1.2]:
                             for bias_after_scale in [False, True]:
-                                self.num_input = num_input
-                                self.dims = dims
-                                dics = [
-                                    {
-                                        "scale": scale,
-                                        "bias": bias,
-                                        "bias_after_scale": bias_after_scale,
-                                    },
-                                    {},
-                                ]
-
-                                dics_intput = [
-                                    {
-                                        "X": ["scale_input"],
-                                        "ScaleTensor": ["ScaleTensor"],
-                                    },
-                                    {"X": ["scale_input"]},
-                                ]
-                                dics_intputs = [
-                                    {
-                                        "ScaleTensor": TensorConfig(
-                                            data_gen=partial(
-                                                generate_weight1, dics
+                                for is_int in [False, True]:
+                                    self.num_input = num_input
+                                    self.dims = dims
+                                    self.is_int = is_int
+                                    dics = [
+                                        {
+                                            "scale": scale,
+                                            "bias": bias,
+                                            "bias_after_scale": bias_after_scale,
+                                        },
+                                        {},
+                                    ]
+
+                                    dics_intput = [
+                                        {
+                                            "X": ["scale_input"],
+                                            "ScaleTensor": ["ScaleTensor"],
+                                        },
+                                        {"X": ["scale_input"]},
+                                    ]
+                                    dics_intputs = [
+                                        {
+                                            "ScaleTensor": TensorConfig(
+                                                data_gen=partial(
+                                                    generate_weight1,
+                                                    dics,
+                                                    is_int,
+                                                )
                                             )
-                                        )
-                                    },
-                                    {},
-                                ]
-
-                                ops_config = [
-                                    {
-                                        "op_type": "scale",
-                                        "op_inputs": dics_intput[num_input],
-                                        "op_outputs": {"Out": ["scale_out"]},
-                                        "op_attrs": dics[0],
-                                    }
-                                ]
-                                ops = self.generate_op_config(ops_config)
-                                program_config = ProgramConfig(
-                                    ops=ops,
-                                    weights=dics_intputs[num_input],
-                                    inputs={
-                                        "scale_input": TensorConfig(
-                                            data_gen=partial(
-                                                generate_input1, dics, batch
+                                        },
+                                        {},
+                                    ]
+
+                                    ops_config = [
+                                        {
+                                            "op_type": "scale",
+                                            "op_inputs": dics_intput[num_input],
+                                            "op_outputs": {
+                                                "Out": ["scale_out"]
+                                            },
+                                            "op_attrs": dics[0],
+                                        }
+                                    ]
+                                    ops = self.generate_op_config(ops_config)
+                                    program_config = ProgramConfig(
+                                        ops=ops,
+                                        weights=dics_intputs[num_input],
+                                        inputs={
+                                            "scale_input": TensorConfig(
+                                                data_gen=partial(
+                                                    generate_input1,
+                                                    dics,
+                                                    batch,
+                                                    is_int,
+                                                )
                                             )
-                                        )
-                                    },
-                                    outputs=["scale_out"],
-                                )
+                                        },
+                                        outputs=["scale_out"],
+                                    )
 
-                                yield program_config
+                                    yield program_config
 
     def sample_predictor_configs(
         self, program_config
@@ -182,6 +197,17 @@ class TrtConvertScaleTest(TrtLayerAutoScanTest):
             "INPUT DIM EQUAL TO 1 OF STATIC SHAPE NOT SUPPORT",
         )
 
+        def teller3(program_config, predictor_config):
+            if self.is_int and len(self.dynamic_shape.min_input_shape) == 0:
+                return True
+            return False
+
+        self.add_skip_case(
+            teller3,
+            SkipReasons.TRT_NOT_SUPPORT,
+            "INTEGER INPUT OF STATIC SHAPE NOT SUPPORT",
+        )
+
     def test(self):
         self.add_skip_trt_case()
         self.run_test()
-- 
GitLab