// Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#include "paddle/infrt/api/infrt_api.h"

#include <llvm/ADT/SmallVector.h>
#include <llvm/Support/DynamicLibrary.h>
#include <mlir/IR/BuiltinOps.h>

#include <iostream>
#include <unordered_map>
#include <vector>

#include "paddle/infrt/common/global.h"
#include "paddle/infrt/dialect/dense_tensor.h"
#include "paddle/infrt/dialect/infrt/infrt_dialect.h"
#include "paddle/infrt/dialect/mlir_loader.h"
#include "paddle/infrt/host_context/core_runtime.h"
#include "paddle/infrt/host_context/kernel_registry.h"
#include "paddle/infrt/host_context/mlir_function_executable.h"
#include "paddle/infrt/host_context/mlir_to_runtime_translate.h"
#include "paddle/infrt/host_context/op_executable.h"
#include "paddle/infrt/host_context/value.h"
#include "paddle/infrt/kernel/basic_kernels.h"
#include "paddle/infrt/kernel/control_flow_kernels.h"
#include "paddle/infrt/kernel/tensor_kernels.h"
#include "paddle/infrt/kernel/tensor_shape_kernels.h"
#include "paddle/infrt/kernel/test_kernels.h"
#include "paddle/infrt/tensor/tensor_map.h"

using namespace infrt::host_context;  // NOLINT
using namespace infrt::tensor;        // NOLINT

namespace infrt {

template <typename T>
std::string DumpToString(T& op) {  // NOLINT
  std::string buffer;
  llvm::raw_string_ostream os(buffer);
  op.print(os);
  os.flush();
  return buffer;
}

struct MlirToRuntimeTranslator::Impl {
  mlir::ModuleOp module;
  // The runtime for a function call.
  CoreRuntimeBuilder* runtime{};
  // The current working op. The translator processes the ops one by one,
  // updating `cur_op` to the op it is currently working on.
  OpExecutableBuilder* cur_op{};
  // Record the current function name.
  std::string cur_func_name;

  // Name to function definitions.
  std::unordered_map<std::string, mlir::FuncOp> func_defs;

  // Map from an operation to its results.
  std::unordered_map<mlir::Operation*, std::vector<ValueRef>> op_results;
  llvm::DenseMap<mlir::Value, ValueRef> value_map;
};

/**
 * Execute the mlir program in predict mode.
 */
class PredictExecutor : public MlirToRuntimeTranslator {
 public:
  CoreRuntimeBuilder core_runtime;

  PredictExecutor(mlir::ModuleOp module,
                  KernelRegistry* registry,
                  TensorMap* map)
      : MlirToRuntimeTranslator(module, &core_runtime),
        core_runtime(registry),
        registry_(registry) {
    CHECK(registry_);
    Init(map);
  }

  void Run() {
    auto arguments = llvm::makeArrayRef(arguments_);
    auto results =
        llvm::makeMutableArrayRef(results_.begin(), results_.size());
    function_executable_->Execute(arguments, results);
  }

  int GetInputNum() { return inputs_.size(); }

  DenseHostTensor* GetInput(int i) { return inputs_[i]; }

  int GetOutputNum() { return outputs_.size(); }

  DenseHostTensor* GetOutput(int i) { return outputs_[i]; }

 private:
  void Init(TensorMap* map) {
    EmitFunctions();
    llvm::Optional<mlir::FuncOp> predict_func_ = llvm::None;
    for (auto func_op : impl_->module.getOps<mlir::FuncOp>()) {
      if (func_op.getName().str() != "predict") continue;
      predict_func_ = func_op;
      break;
    }
    if (!predict_func_) {
      std::cout << "ERROR: init failed, no predict function found in mlir."
                << std::endl;
      return;
    }
    auto& predict_func = predict_func_.getValue();
    function_executable_ =
        new MlirFunctionExecutable(predict_func, registry_, impl_->func_defs);

    // Process parameters.
    for (size_t i = 0; i < predict_func.getNumArguments(); ++i) {
      auto arg = predict_func.getArgument(i);
      auto type = arg.getType();
      // This param is the TensorMap.
      if (type.isa<infrt::DenseTensorMapType>()) {
        auto* value = new host_context::Value(std::move(*map));
        arguments_.push_back(value);
        AddValue(predict_func.getArgument(i), value);
      } else {
        // This param is an input Tensor.
        auto dht = DenseHostTensor();
        auto* value = new host_context::Value(std::move(dht));
        arguments_.push_back(value);
        inputs_.push_back(&(value->get<DenseHostTensor>()));
      }
    }

    // Process results.
    auto& last_op = predict_func.front().back();
    if (last_op.getName().getStringRef() == "Infrt.return") {
      for (size_t i = 0; i < last_op.getNumOperands(); ++i) {
        auto* value = AddValue(mlir::Value(last_op.getOperand(i)));
        results_.push_back(ValueRef(value));
        outputs_.push_back(&(value->get<DenseHostTensor>()));
      }
    }
  }

 protected:
  std::unordered_map<std::string, mlir::FuncOp> func_def_table;

  void EmitFunction(mlir::FuncOp op) override {
    CHECK(!impl_->func_defs.count(op.getName().str()))
        << "Duplicate function definition found for function ["
        << op.getName().str() << "]";
    impl_->func_defs.emplace(op.getName().str(), op);
  }

 private:
  KernelRegistry* registry_{};
  MlirFunctionExecutable* function_executable_;
  llvm::SmallVector<DenseHostTensor*, 1> inputs_;
  llvm::SmallVector<host_context::Value*, 2> arguments_;
  llvm::SmallVector<DenseHostTensor*, 1> outputs_;
  llvm::SmallVector<ValueRef, 1> results_;
};

std::shared_ptr<InfRtPredictor> CreateInfRtPredictor(
    const InfRtConfig& config) {
  auto x = std::make_shared<InfRtPredictor>();
  x->Init(config);
  return x;
}

struct InfRtPredictor::Impl {
  mlir::OwningModuleRef module_ref;
  std::unique_ptr<PredictExecutor> executor;
};

InfRtPredictor::InfRtPredictor() : impl_(new Impl) {}
InfRtPredictor::~InfRtPredictor() {}

void InfRtPredictor::Run() { impl_->executor->Run(); }

int InfRtPredictor::Init(const InfRtConfig& config) {
  mlir::MLIRContext* context = infrt::Global::getMLIRContext();
  auto module_ref = dialect::LoadMlirFile(config.mlir_path(), context);

  KernelRegistry* registry = new KernelRegistry();

  kernel::RegisterBasicKernels(registry);
  kernel::RegisterTestKernels(registry);
  kernel::RegisterTensorShapeKernels(registry);
  kernel::RegisterTensorKernels(registry);
  kernel::RegisterControlFlowKernels(registry);

  impl_->module_ref = std::move(module_ref);

  // Load extra shared libraries.
  for (const std::string& lib_path : config.shared_libs()) {
    std::string err;
    llvm::sys::DynamicLibrary dynLib =
        llvm::sys::DynamicLibrary::getPermanentLibrary(lib_path.c_str(), &err);
    if (!dynLib.isValid()) {
      llvm::errs() << "Load shared library failed. Error: " << err << "\n";
      return 1;
    }
    if (auto reg_sym = dynLib.SearchForAddressOfSymbol("RegisterKernels")) {
      auto reg_func = reinterpret_cast<void (*)(KernelRegistry*)>(reg_sym);
      reg_func(registry);
    } else {
      llvm::outs() << "Symbol \"RegisterKernels\" not found in \"" << lib_path
                   << "\". Skip.\n";
    }
  }

  // Load params.
  TensorMap* tensor_map = LoadParams(config.model_dir());

  // Create PredictExecutor.
  impl_->executor.reset(
      new PredictExecutor(impl_->module_ref.get(), registry, tensor_map));
  return 0;
}

int InfRtPredictor::GetInputNum() { return impl_->executor->GetInputNum(); }

DenseHostTensor* InfRtPredictor::GetInput(int i) {
  return impl_->executor->GetInput(i);
}

int InfRtPredictor::GetOutputNum() { return impl_->executor->GetOutputNum(); }

DenseHostTensor* InfRtPredictor::GetOutput(int i) {
  return impl_->executor->GetOutput(i);
}

}  // namespace infrt
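
// Usage sketch (illustrative only, not compiled as part of this file): how a
// caller is expected to drive the API defined above. The config field names
// follow the getters used in Init() (`model_dir()`, `mlir_path()`,
// `shared_libs()`); the corresponding setters and the concrete paths are
// assumptions, not confirmed by this translation unit.
//
//   infrt::InfRtConfig config;
//   config.set_model_dir("/path/to/model");       // assumed setter
//   config.set_mlir_path("/path/to/model.mlir");  // assumed setter
//
//   auto predictor = infrt::CreateInfRtPredictor(config);
//
//   // Fill the input tensors exposed by the executor, then run.
//   for (int i = 0; i < predictor->GetInputNum(); ++i) {
//     infrt::tensor::DenseHostTensor* input = predictor->GetInput(i);
//     // ... resize `input` and write input data ...
//   }
//   predictor->Run();
//   infrt::tensor::DenseHostTensor* output = predictor->GetOutput(0);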