build(cuda): link to cuda_stub

GitOrigin-RevId: 073d3313cf961392666e331f8c116a5d0520ccc8

build(cuda): link to cuda_stub
GitOrigin-RevId: 073d3313cf961392666e331f8c116a5d0520ccc8
c9348b16 · Megvii Engine Team · 33ab2454 · c9348b16
隐藏空白更改
内联并排

Showing 1 changed file with 4 additions and 0 deletions

src/tensorrt/impl/tensorrt_opr.cpp src/tensorrt/impl/tensorrt_opr.cpp +4 -0

未找到文件。
--- a/src/tensorrt/impl/tensorrt_opr.cpp
+++ b/src/tensorrt/impl/tensorrt_opr.cpp
@@ -227,8 +227,10 @@ void TensorRTManager::exec(cg::SingleCNOperatorNodeBase* opr,
 #endif
        mgb_assert(exec_success, "TensorRTOpr failed in execution.");
    } else {
+#if MGB_ENABLE_JSON
        TensorRTProfiler trt_profiler;
        m_context->setProfiler(&trt_profiler);
+#endif  // MGB_ENABLE_JSON
        // TensorRT documentation stated that IExecutionContext->execute
        // "Synchronously execute inference on a batch", and it does not take a
        // cudaStream_t, we expect it do a device synchronize. But it seems like
@@ -245,8 +247,10 @@ void TensorRTManager::exec(cg::SingleCNOperatorNodeBase* opr,
        exec_success = m_context->execute(batch, m_trt_iobuf.data());
 #endif
        mgb_assert(exec_success, "trt execution failed: opr=%s", opr->cname());
+#if MGB_ENABLE_JSON
        printf("TRT profile info of opr %s:\n", opr->name().c_str());
        trt_profiler.print_layer_times();
+#endif  // MGB_ENABLE_JSON
    }
 }