From abe3c165ba494656626cbc141361c896f9243640 Mon Sep 17 00:00:00 2001
From: Megvii Engine Team <megengine@megvii.com>
Date: Thu, 14 Jan 2021 14:02:57 +0800
Subject: [PATCH] feat(mge): tensorrt runtime opr

GitOrigin-RevId: 2fdd00adcbbe272e79d53ba0ac879d2eedf471d0
---
 .gitattributes                                |  2 +-
 .../python/megengine/functional/external.py   | 22 +++++++++++
 .../python/megengine/module/external.py       | 37 +++++++++++++++++++
 .../python/test/unit/module/test_external.py  |  8 ++++
 imperative/src/impl/ops/tensorrt_runtime.cpp  | 32 ++++++++++++++++
 src/core/include/megbrain/ir/ops.td           |  7 ++++
 6 files changed, 107 insertions(+), 1 deletion(-)
 create mode 100644 imperative/python/megengine/functional/external.py
 create mode 100644 imperative/python/megengine/module/external.py
 create mode 100644 imperative/src/impl/ops/tensorrt_runtime.cpp

diff --git a/.gitattributes b/.gitattributes
index b57774eb5..84691370d 100644
--- a/.gitattributes
+++ b/.gitattributes
@@ -5,4 +5,4 @@ dnn/src/cuda/conv_bias/int8_imma/kimpl/* binary
 dnn/src/cuda/batch_conv_bias/int8/kimpl/* binary
 dnn/src/cuda/sass/prebuilt/map_defs.cpp binary
 tools/mlir/mlir-tblgen filter=lfs diff=lfs merge=lfs -text
-sdk/c-opr-loaders/mc40/example/sinopec_nv12_extra.neu filter=lfs diff=lfs merge=lfs -text
+*.caffemodel filter=lfs diff=lfs merge=lfs -text
diff --git a/imperative/python/megengine/functional/external.py b/imperative/python/megengine/functional/external.py
new file mode 100644
index 000000000..c1e6373f6
--- /dev/null
+++ b/imperative/python/megengine/functional/external.py
@@ -0,0 +1,22 @@
+# -*- coding: utf-8 -*-
+# MegEngine is Licensed under the Apache License, Version 2.0 (the "License")
+#
+# Copyright (c) 2014-2021 Megvii Inc. All rights reserved.
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# pylint: disable=redefined-builtin
+from typing import Sequence
+
+from ..core._imperative_rt.core2 import apply
+from ..core.ops import builtin
+
+
+def tensorrt_runtime_opr(inputs, *, data: bytes = None):
+    # No serialized model supplied (data is None): skip the op and return None.
+    if data is None:
+        return None
+    op = builtin.TensorRTRuntime(data, len(data))  # the buffer plus its length
+    # Inputs are unpacked as positional operands; the result is the sequence of outputs.
+    return apply(op, *inputs)
diff --git a/imperative/python/megengine/module/external.py b/imperative/python/megengine/module/external.py
new file mode 100644
index 000000000..ae98c8c4f
--- /dev/null
+++ b/imperative/python/megengine/module/external.py
@@ -0,0 +1,37 @@
+# -*- coding: utf-8 -*-
+# MegEngine is Licensed under the Apache License, Version 2.0 (the "License")
+#
+# Copyright (c) 2014-2021 Megvii Inc. All rights reserved.
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# pylint: disable=redefined-builtin
+import numpy as np
+
+from ..functional.external import tensorrt_runtime_opr
+from .module import Module
+
+
+class TensorrtRuntimeSubgraph(Module):
+    r"""Module that holds a serialized TensorRT runtime subgraph in ``data``.
+
+    ``forward`` hands its inputs and that data to :func:`~.tensorrt_runtime_opr`.
+    """
+
+    def __init__(
+        self, data,
+    ):
+        super(TensorrtRuntimeSubgraph, self).__init__()
+        self._data = data  # stored as given; NOTE(review): the setter converts to uint8 instead - confirm intended
+
+    @property
+    def data(self):
+        return self._data  # whatever was stored last (constructor value or setter result)
+
+    @data.setter
+    def data(self, val):
+        self._data = np.frombuffer(val, dtype=np.uint8)  # view the buffer as a 1-D uint8 array
+
+    def forward(self, *inputs):
+        return tensorrt_runtime_opr(inputs, data=self._data)  # yields None when the stored data is None
diff --git a/imperative/python/test/unit/module/test_external.py b/imperative/python/test/unit/module/test_external.py
index cab28c457..a39ea4a58 100644
--- a/imperative/python/test/unit/module/test_external.py
+++ b/imperative/python/test/unit/module/test_external.py
@@ -6,14 +6,20 @@
 # Unless required by applicable law or agreed to in writing,
 # software distributed under the License is distributed on an
 # "AS IS" BASIS, WITHOUT ARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+import io
 import os
+import platform
 
 import numpy as np
 import pytest
 
 import megengine as mge
+import megengine.utils.comp_graph_tools as cgtools
 from megengine import Tensor
+from megengine.distributed.helper import get_device_count_by_fork
+from megengine.jit import trace
 from megengine.module import Module
+from megengine.module.external import TensorrtRuntimeSubgraph
 
 
 class MyModule(Module):
@@ -44,3 +50,5 @@ def test_cambricon_module():
             return pred
 
         pred = inference([inp])
+
+
diff --git a/imperative/src/impl/ops/tensorrt_runtime.cpp b/imperative/src/impl/ops/tensorrt_runtime.cpp
new file mode 100644
index 000000000..a5eef4591
--- /dev/null
+++ b/imperative/src/impl/ops/tensorrt_runtime.cpp
@@ -0,0 +1,32 @@
+/**
+ * \file imperative/src/impl/ops/tensorrt_runtime.cpp
+ * MegEngine is Licensed under the Apache License, Version 2.0 (the "License")
+ *
+ * Copyright (c) 2014-2021 Megvii Inc. All rights reserved.
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ */
+#include "../op_trait.h"
+#include "megbrain/imperative/ops/autogen.h"
+
+#if MGB_ENABLE_TENSOR_RT
+#include "megbrain/tensorrt/tensorrt_runtime_opr.h"
+namespace mgb::imperative {
+
+namespace { namespace tensorrt_runtime {
+    auto apply_on_var_node(  // creates the TensorRTRuntimeOpr for a TensorRTRuntime op definition
+            const OpDef& def,
+            const VarNodeArray& inputs) {
+        auto&& op = static_cast<const TensorRTRuntime&>(def);  // unchecked downcast of def
+        SymbolVarArray sinputs(inputs.begin(), inputs.end());  // copy the inputs into a SymbolVarArray
+        return opr::TensorRTRuntimeOpr::make(op.buf.c_str(), op.buf_size, sinputs);  // buffer pointer + explicit size
+    }
+OP_TRAIT_REG(TensorRTRuntime, TensorRTRuntime)
+    .apply_on_var_node(apply_on_var_node)  // hook up the function defined above
+    .fallback();
+}} // namespace tensorrt_runtime, anonymous namespace
+
+} // namespace mgb::imperative
+#endif  // MGB_ENABLE_TENSOR_RT
diff --git a/src/core/include/megbrain/ir/ops.td b/src/core/include/megbrain/ir/ops.td
index 7f06a49ac..7ac9f0493 100644
--- a/src/core/include/megbrain/ir/ops.td
+++ b/src/core/include/megbrain/ir/ops.td
@@ -241,4 +241,11 @@ def ElemwiseMultiType: MgbHashableOp<"ElemwiseMultiType", [ElemwiseMultiTypePara
 
 def InplaceAdd: MgbHashableOp<"InplaceAdd", [EmptyParam]>;
 
+def TensorRTRuntime: MgbHashableOp<"TensorRTRuntime"> {
+  let extraArguments = (ins
+    MgbStringAttr:$buf,  // model buffer; read as op.buf in tensorrt_runtime.cpp
+    MgbSizeTAddr:$buf_size  // its length; the Python wrapper passes len(data)
+  );
+}
+
 #endif // MGB_OPS
-- 
GitLab