From 2943aca7d54d7348733226a89b9f28cd5dafdb3d Mon Sep 17 00:00:00 2001 From: bukejiyu <52310069+bukejiyu@users.noreply.github.com> Date: Wed, 7 Jun 2023 19:23:13 +0800 Subject: [PATCH] [inference][trt]unary, bitwise_not,one_hot op and inspector ci adjust for TensorRT8.6 (#54251) * unary bitwise_not adapter tensorRT8.6 in Paddle-TensorRT * one_hot_op ci fix * Update test_trt_inspector.py delete log --- .../inference/tensorrt/convert/unary_op.cc | 8 ++--- paddle/fluid/inference/tensorrt/op_teller.cc | 18 +++++++--- .../inference/test_trt_convert_bitwise_not.py | 34 +++++++++++++------ test/ir/inference/test_trt_convert_one_hot.py | 32 ++++++++--------- test/ir/inference/test_trt_convert_unary.py | 12 +++++-- test/ir/inference/test_trt_inspector.py | 2 +- 6 files changed, 67 insertions(+), 39 deletions(-) diff --git a/paddle/fluid/inference/tensorrt/convert/unary_op.cc b/paddle/fluid/inference/tensorrt/convert/unary_op.cc index e52cc87d750..a313fa1f711 100644 --- a/paddle/fluid/inference/tensorrt/convert/unary_op.cc +++ b/paddle/fluid/inference/tensorrt/convert/unary_op.cc @@ -43,7 +43,7 @@ class UnaryOpConverter : public OpConverter { engine_->GetITensor(op_desc.Input("X")[0]); auto op_pair = ops.find(op_type_); nvinfer1::ILayer* layer = nullptr; -#if !IS_TRT_VERSION_GE(8500) + nvinfer1::DataType org_type = input_tensor->getType(); bool cast = org_type == nvinfer1::DataType::kINT8 || org_type == nvinfer1::DataType::kINT32; @@ -56,19 +56,19 @@ class UnaryOpConverter : public OpConverter { } input_tensor = layer->getOutput(0); } -#endif + for (auto trt_op : op_pair->second) { layer = TRT_ENGINE_ADD_LAYER(engine_, Unary, *input_tensor, trt_op); input_tensor = layer->getOutput(0); } -#if !IS_TRT_VERSION_GE(8500) + // type restore if (cast) { layer = TRT_ENGINE_ADD_LAYER(engine_, Identity, *input_tensor); layer->setOutputType(0, org_type); input_tensor = layer->getOutput(0); } -#endif + auto output_name = op_desc.Output("Out")[0]; RreplenishLayerAndOutput(layer, op_type_, 
{output_name}, test_mode); } diff --git a/paddle/fluid/inference/tensorrt/op_teller.cc b/paddle/fluid/inference/tensorrt/op_teller.cc index b0de399382c..826d607c4ca 100644 --- a/paddle/fluid/inference/tensorrt/op_teller.cc +++ b/paddle/fluid/inference/tensorrt/op_teller.cc @@ -1881,18 +1881,28 @@ struct SimpleOpTypeSetTeller : public Teller { } if (op_type == "bitwise_not") { -#if !IS_TRT_VERSION_GE(8400) auto* block = desc.Block(); auto x_var_name = desc.Input("X")[0]; auto* x_var_desc = block->FindVar(x_var_name); auto dtype = x_var_desc->GetDataType(); - if (dtype == framework::proto::VarType::BOOL || - dtype == framework::proto::VarType::INT8 || + if (dtype == framework::proto::VarType::INT8 || dtype == framework::proto::VarType::UINT8) { - VLOG(3) << "BOOL / INT8 / UINT8 type support requires TensorRT 8.4"; + VLOG(3) << "INT8 / UINT8 type convert to trt is not supported"; return false; } + if (dtype == framework::proto::VarType::BOOL) { +#if !IS_TRT_VERSION_GE(8400) + VLOG(3) << "BOOL type support requires TensorRT 8.4"; + return false; +#elif !IS_TRT_VERSION_GE(8600) + const auto x_shape = x_var_desc->GetShape(); + if (x_shape.size() == 0) { + VLOG(3) + << "BOOL type does not support 0 dim input when TensorRT < 8.6."; + return false; + } #endif + } } if (op_type == "one_hot" || op_type == "one_hot_v2") { diff --git a/test/ir/inference/test_trt_convert_bitwise_not.py b/test/ir/inference/test_trt_convert_bitwise_not.py index 49f00b52237..ab8da867362 100644 --- a/test/ir/inference/test_trt_convert_bitwise_not.py +++ b/test/ir/inference/test_trt_convert_bitwise_not.py @@ -31,7 +31,9 @@ class TrtConvertActivationTest(TrtLayerAutoScanTest): self.trt_param.workspace_size = 1073741824 def generate_input1(dims, batch, attrs: List[Dict[str, Any]]): - if dims == 1: + if dims == 0: + return np.random.random([]).astype(np.bool8) + elif dims == 1: return np.random.random([32]).astype(np.bool8) elif dims == 2: return np.random.random([3, 32]).astype(np.int8) @@ -40,7 +42,7 
@@ class TrtConvertActivationTest(TrtLayerAutoScanTest): else: return np.random.random([batch, 3, 32, 32]).astype(np.int64) - for dims in [1, 2, 3, 4]: + for dims in [0, 1, 2, 3, 4]: for batch in [1, 4]: self.dims = dims dics = [{}] @@ -65,13 +67,20 @@ class TrtConvertActivationTest(TrtLayerAutoScanTest): }, outputs=["output_data"], ) + program_config.input_type = program_config.inputs[ + 'input_data' + ].dtype yield program_config def sample_predictor_configs( self, program_config ) -> (paddle_infer.Config, List[int], float): def generate_dynamic_shape(attrs): - if self.dims == 1: + if self.dims == 0: + self.dynamic_shape.min_input_shape = {"input_data": []} + self.dynamic_shape.max_input_shape = {"input_data": []} + self.dynamic_shape.opt_input_shape = {"input_data": []} + elif self.dims == 1: self.dynamic_shape.min_input_shape = {"input_data": [1]} self.dynamic_shape.max_input_shape = {"input_data": [64]} self.dynamic_shape.opt_input_shape = {"input_data": [32]} @@ -102,16 +111,19 @@ class TrtConvertActivationTest(TrtLayerAutoScanTest): def generate_trt_nodes_num(attrs, dynamic_shape): ver = paddle_infer.get_trt_compile_version() trt_version = ver[0] * 1000 + ver[1] * 100 + ver[2] * 10 - if trt_version >= 8400: - if self.dims == 1: + if not dynamic_shape: + if self.dims == 1 or self.dims == 0: return 0, 3 - return 1, 2 - else: - if self.dims <= 2 or ( - program_config.inputs['input_data'].dtype - in ['bool', 'int8', 'uint8'] - ): + if program_config.input_type in ['int8', 'uint8']: + return 0, 3 + elif program_config.input_type == 'bool': + if trt_version < 8600 and self.dims == 0: return 0, 3 + elif trt_version < 8400: + return 0, 3 + else: + return 1, 2 + else: return 1, 2 attrs = [ diff --git a/test/ir/inference/test_trt_convert_one_hot.py b/test/ir/inference/test_trt_convert_one_hot.py index 30446265a43..5332cb950ae 100644 --- a/test/ir/inference/test_trt_convert_one_hot.py +++ b/test/ir/inference/test_trt_convert_one_hot.py @@ -52,10 +52,10 @@ class
TrtConvertOneHotTest(TrtLayerAutoScanTest): dics = [{"dtype": 5, "depth": 10}, {}] ops_config = [ { - "op_type": "one_hot", + "op_type": "one_hot_v2", "op_inputs": { - "X": ["input_x_data"], - "depth_tensor": ["input_depth_data"], + "X": ["indices_tensor"], + "depth_tensor": ["depth_tensor_data"], }, "op_outputs": {"Out": ["output_data"]}, "op_attrs": dics[0], @@ -67,7 +67,7 @@ class TrtConvertOneHotTest(TrtLayerAutoScanTest): program_config = ProgramConfig( ops=ops, weights={ - "depth_tensor": TensorConfig( + "depth_tensor_data": TensorConfig( data_gen=partial(generate_depth, dims, batch) ), }, @@ -87,43 +87,43 @@ class TrtConvertOneHotTest(TrtLayerAutoScanTest): def generate_dynamic_shape(attrs): if self.dims == 1: self.dynamic_shape.min_input_shape = { - "input_x_data": [1], + "indices_tensor": [1], } self.dynamic_shape.max_input_shape = { - "input_x_data": [2], + "indices_tensor": [2], } self.dynamic_shape.opt_input_shape = { - "input_x_data": [1], + "indices_tensor": [1], } elif self.dims == 2: self.dynamic_shape.min_input_shape = { - "input_x_data": [1, 4], + "indices_tensor": [1, 4], } self.dynamic_shape.max_input_shape = { - "input_x_data": [2, 4], + "indices_tensor": [2, 4], } self.dynamic_shape.opt_input_shape = { - "input_x_data": [1, 4], + "indices_tensor": [1, 4], } elif self.dims == 3: self.dynamic_shape.min_input_shape = { - "input_x_data": [1, 4, 6], + "indices_tensor": [1, 4, 6], } self.dynamic_shape.max_input_shape = { - "input_x_data": [2, 4, 6], + "indices_tensor": [2, 4, 6], } self.dynamic_shape.opt_input_shape = { - "input_x_data": [1, 4, 6], + "indices_tensor": [1, 4, 6], } elif self.dims == 4: self.dynamic_shape.min_input_shape = { - "input_x_data": [1, 4, 6, 8], + "indices_tensor": [1, 4, 6, 8], } self.dynamic_shape.max_input_shape = { - "input_x_data": [2, 4, 6, 8], + "indices_tensor": [2, 4, 6, 8], } self.dynamic_shape.opt_input_shape = { - "input_x_data": [1, 4, 6, 8], + "indices_tensor": [1, 4, 6, 8], } def clear_dynamic_shape(): diff 
--git a/test/ir/inference/test_trt_convert_unary.py b/test/ir/inference/test_trt_convert_unary.py index 322130c83f5..1d83978f2f0 100644 --- a/test/ir/inference/test_trt_convert_unary.py +++ b/test/ir/inference/test_trt_convert_unary.py @@ -37,7 +37,7 @@ class TrtConvertActivationTest(TrtLayerAutoScanTest): def generate_input1(dims, batch, attrs: List[Dict[str, Any]]): if dims == 0: return np.random.random([]).astype(np.float32) - if dims == 2: + elif dims == 2: return np.random.random([3, 32]).astype(np.float32) elif dims == 3: return np.random.random([3, 32, 32]).astype(np.float32) @@ -47,7 +47,7 @@ class TrtConvertActivationTest(TrtLayerAutoScanTest): def generate_int_input(dims, batch, attrs: List[Dict[str, Any]]): if dims == 0: return np.random.random([]).astype(np.int32) - if dims == 2: + elif dims == 2: return np.random.random([3, 32]).astype(np.int32) elif dims == 3: return np.random.random([3, 32, 32]).astype(np.int32) @@ -146,7 +146,11 @@ class TrtConvertActivationTest(TrtLayerAutoScanTest): self, program_config ) -> (paddle_infer.Config, List[int], float): def generate_dynamic_shape(attrs): - if self.dims == 1: + if self.dims == 0: + self.dynamic_shape.min_input_shape = {"input_data": []} + self.dynamic_shape.max_input_shape = {"input_data": []} + self.dynamic_shape.opt_input_shape = {"input_data": []} + elif self.dims == 1: self.dynamic_shape.min_input_shape = {"input_data": [1]} self.dynamic_shape.max_input_shape = {"input_data": [64]} self.dynamic_shape.opt_input_shape = {"input_data": [32]} @@ -193,6 +197,8 @@ class TrtConvertActivationTest(TrtLayerAutoScanTest): and self.dims == 0 ): return 0, 3 + if not dynamic_shape and (self.dims == 1 or self.dims == 0): + return 0, 3 return 1, 2 attrs = [ diff --git a/test/ir/inference/test_trt_inspector.py b/test/ir/inference/test_trt_inspector.py index 7985e8f1374..a1bb1579891 100644 --- a/test/ir/inference/test_trt_inspector.py +++ b/test/ir/inference/test_trt_inspector.py @@ -72,7 +72,7 @@ class
TensorRTInspectorTest(InferencePassTest): self.assertTrue('====== engine info ======' in engine_info) self.assertTrue('====== engine info end ======' in engine_info) self.assertTrue('matmul' in engine_info) - self.assertTrue('LayerType: Scale' in engine_info) + self.assertTrue('"LayerType": "Scale"' in engine_info) self.assertTrue('batch_norm' in engine_info) else: self.assertTrue( -- GitLab