Unverified · Commit dbc63555 · authored by wenbin, committed by GitHub

support int input for scale (#48044)

* int scale

* round

* revert commit
Parent 5329187d
@@ -49,9 +49,12 @@ class ScaleOpConverter : public OpConverter {
           PADDLE_GET_CONST(bool, op_desc.GetAttr("bias_after_scale"));
   float bias = PADDLE_GET_CONST(float, op_desc.GetAttr("bias"));
   float scale = PADDLE_GET_CONST(float, op_desc.GetAttr("scale"));
+  bool is_int = input->getType() == nvinfer1::DataType::kINT32;
   nvinfer1::ILayer* layer = nullptr;
   if (engine_->with_dynamic_shape()) {
-    nvinfer1::ITensor* bias_tensor = Add1DConstantLayer(bias);
+    nvinfer1::ITensor* bias_tensor =
+        is_int ? Add1DConstantLayer(static_cast<int>(bias))
+               : Add1DConstantLayer(bias);
     bool is_bias_0 = (bias < 1e-06 && bias > -1e-06);
     std::vector<int32_t> bias_shapes(input->getDimensions().nbDims, 1);
@@ -72,7 +75,8 @@ class ScaleOpConverter : public OpConverter {
       is_scale_1 = false;
     } else {
       has_scale_tensor = false;
-      scale_tensor = Add1DConstantLayer(scale);
+      scale_tensor = is_int ? Add1DConstantLayer(static_cast<int>(scale))
+                            : Add1DConstantLayer(scale);
       is_scale_1 = ((scale - 1.0) < 1e-06 && (scale - 1.0) > -1e-06);
     }
......
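For context, the scale op computes out = scale * x + bias (with bias_after_scale = true); the hunk above only switches the constant layers feeding that computation to integer values when the input tensor is kINT32. A minimal eager-mode sketch of the same arithmetic on an int32 input (illustration only, not part of the commit; assumes a Paddle 2.x installation):

```python
# Sketch: what the converted op computes on an int32 input.
# With is_int, scale/bias are cast to int, mirroring the
# static_cast<int> branches in the converter above.
import numpy as np
import paddle

x = paddle.to_tensor(np.ones([2, 3], dtype=np.int32))
y = paddle.scale(x, scale=2.0, bias=1.0, bias_after_scale=True)
print(y.dtype, y.numpy())  # paddle.int32, every element is 2 * 1 + 1 = 3
```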
@@ -1076,13 +1076,24 @@ struct SimpleOpTypeSetTeller : public Teller {
       auto* x_var_desc = block->FindVar(x_var_name);
       const auto x_shape = x_var_desc->GetShape();
       auto dtype = x_var_desc->GetDataType();
-      // At present, only support float32 or float16 into trt.
-      if (!(dtype == 5 || dtype == 4)) {
-        return false;
-      }
-      if (!with_dynamic_shape && x_shape.size() == 1) {
-        VLOG(3) << "Scale op does not support 1-dimensional input in tensorrt";
-        return false;
-      }
+      if (!with_dynamic_shape) {
+        // At present, only support float32 or float16 into trt.
+        if (!(dtype == framework::proto::VarType::FP32 ||
+              dtype == framework::proto::VarType::FP16)) {
+          return false;
+        }
+        if (x_shape.size() == 1) {
+          VLOG(3)
+              << "Scale op does not support 1-dimensional input in tensorrt";
+          return false;
+        }
+      } else {
+        // At present, only support float32 or float16 or int32 into trt.
+        if (!(dtype == framework::proto::VarType::FP32 ||
+              dtype == framework::proto::VarType::FP16 ||
+              dtype == framework::proto::VarType::INT32)) {
+          return false;
+        }
+      }
     }
......
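The old teller compared dtype against raw framework.proto enum values (5 and 4); the rewrite spells out the named constants and additionally admits INT32 under dynamic shape. A small sketch of the correspondence, assuming a Paddle 2.x installation where paddle.fluid.core exposes the same enum (illustration only, not part of the commit):

```python
# Sketch: the magic numbers 5 and 4 in the old teller are the
# framework.proto VarType values for FP32 and FP16.
from paddle.fluid import core

VarType = core.VarDesc.VarType
print(int(VarType.FP32))   # 5  -> old check `dtype == 5`
print(int(VarType.FP16))   # 4  -> old check `dtype == 4`
print(int(VarType.INT32))  # 2  -> newly allowed with dynamic shape
```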
@@ -26,18 +26,24 @@ class TrtConvertScaleTest(TrtLayerAutoScanTest):
         return True

     def sample_program_configs(self):
-        def generate_input1(attrs: List[Dict[str, Any]], batch):
+        def generate_input1(attrs: List[Dict[str, Any]], batch, is_int):
             if self.dims == 4:
-                return np.ones([batch, 3, 24, 24]).astype(np.float32)
+                return np.ones([batch, 3, 24, 24]).astype(
+                    np.int32 if is_int else np.float32
+                )
             elif self.dims == 3:
-                return np.ones([batch, 3, 24]).astype(np.float32)
+                return np.ones([batch, 3, 24]).astype(
+                    np.int32 if is_int else np.float32
+                )
             elif self.dims == 2:
-                return np.ones([batch, 24]).astype(np.float32)
+                return np.ones([batch, 24]).astype(
+                    np.int32 if is_int else np.float32
+                )
             elif self.dims == 1:
-                return np.ones([24]).astype(np.float32)
+                return np.ones([24]).astype(np.int32 if is_int else np.float32)

-        def generate_weight1(attrs: List[Dict[str, Any]]):
-            return np.ones([1]).astype(np.float32)
+        def generate_weight1(attrs: List[Dict[str, Any]], is_int):
+            return np.ones([1]).astype(np.int32 if is_int else np.float32)

         for num_input in [0, 1]:
             for dims in [1, 2, 3, 4]:
@@ -45,58 +51,67 @@ class TrtConvertScaleTest(TrtLayerAutoScanTest):
                 for scale in [0.1, -1.0]:
                     for bias in [0.0, 1.2]:
                         for bias_after_scale in [False, True]:
-                            self.num_input = num_input
-                            self.dims = dims
-                            dics = [
-                                {
-                                    "scale": scale,
-                                    "bias": bias,
-                                    "bias_after_scale": bias_after_scale,
-                                },
-                                {},
-                            ]
-
-                            dics_intput = [
-                                {
-                                    "X": ["scale_input"],
-                                    "ScaleTensor": ["ScaleTensor"],
-                                },
-                                {"X": ["scale_input"]},
-                            ]
-                            dics_intputs = [
-                                {
-                                    "ScaleTensor": TensorConfig(
-                                        data_gen=partial(
-                                            generate_weight1, dics
-                                        )
-                                    )
-                                },
-                                {},
-                            ]
-
-                            ops_config = [
-                                {
-                                    "op_type": "scale",
-                                    "op_inputs": dics_intput[num_input],
-                                    "op_outputs": {"Out": ["scale_out"]},
-                                    "op_attrs": dics[0],
-                                }
-                            ]
-                            ops = self.generate_op_config(ops_config)
-                            program_config = ProgramConfig(
-                                ops=ops,
-                                weights=dics_intputs[num_input],
-                                inputs={
-                                    "scale_input": TensorConfig(
-                                        data_gen=partial(
-                                            generate_input1, dics, batch
-                                        )
-                                    )
-                                },
-                                outputs=["scale_out"],
-                            )
-
-                            yield program_config
+                            for is_int in [False, True]:
+                                self.num_input = num_input
+                                self.dims = dims
+                                self.is_int = is_int
+                                dics = [
+                                    {
+                                        "scale": scale,
+                                        "bias": bias,
+                                        "bias_after_scale": bias_after_scale,
+                                    },
+                                    {},
+                                ]
+
+                                dics_intput = [
+                                    {
+                                        "X": ["scale_input"],
+                                        "ScaleTensor": ["ScaleTensor"],
+                                    },
+                                    {"X": ["scale_input"]},
+                                ]
+                                dics_intputs = [
+                                    {
+                                        "ScaleTensor": TensorConfig(
+                                            data_gen=partial(
+                                                generate_weight1,
+                                                dics,
+                                                is_int,
+                                            )
+                                        )
+                                    },
+                                    {},
+                                ]
+
+                                ops_config = [
+                                    {
+                                        "op_type": "scale",
+                                        "op_inputs": dics_intput[num_input],
+                                        "op_outputs": {
+                                            "Out": ["scale_out"]
+                                        },
+                                        "op_attrs": dics[0],
+                                    }
+                                ]
+                                ops = self.generate_op_config(ops_config)
+                                program_config = ProgramConfig(
+                                    ops=ops,
+                                    weights=dics_intputs[num_input],
+                                    inputs={
+                                        "scale_input": TensorConfig(
+                                            data_gen=partial(
+                                                generate_input1,
+                                                dics,
+                                                batch,
+                                                is_int,
+                                            )
+                                        )
+                                    },
+                                    outputs=["scale_out"],
+                                )
+
+                                yield program_config

     def sample_predictor_configs(
         self, program_config
@@ -182,6 +197,17 @@ class TrtConvertScaleTest(TrtLayerAutoScanTest):
             "INPUT DIM EQUAL TO 1 OF STATIC SHAPE NOT SUPPORT",
         )

+        def teller3(program_config, predictor_config):
+            if self.is_int and len(self.dynamic_shape.min_input_shape) == 0:
+                return True
+            return False
+
+        self.add_skip_case(
+            teller3,
+            SkipReasons.TRT_NOT_SUPPORT,
+            "INTEGER INPUT OF STATIC SHAPE NOT SUPPORT",
+        )
+
     def test(self):
         self.add_skip_trt_case()
         self.run_test()
......
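The test now threads an is_int flag through the data generators via functools.partial, and teller3 skips the int32 cases whenever no dynamic-shape profile is configured, matching the teller change above. A self-contained sketch of the partial pattern used here (illustration only; generate_weight1 is copied from the test):

```python
# Sketch: functools.partial pre-binds the new is_int flag so the
# framework can later call the generator with no arguments, as
# TensorConfig(data_gen=...) does in the test above.
from functools import partial
from typing import Any, Dict, List

import numpy as np


def generate_weight1(attrs: List[Dict[str, Any]], is_int):
    return np.ones([1]).astype(np.int32 if is_int else np.float32)


gen_int = partial(generate_weight1, [{}], True)
gen_fp = partial(generate_weight1, [{}], False)
print(gen_int().dtype, gen_fp().dtype)  # int32 float32
```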