diff --git a/lite/load_and_run/src/helpers/common.h b/lite/load_and_run/src/helpers/common.h index 909f1104bdc3054ed20811ebb7db8b54a3780e5b..65481090be2bf8f62e8d6822ee120f7449b6aabd 100644 --- a/lite/load_and_run/src/helpers/common.h +++ b/lite/load_and_run/src/helpers/common.h @@ -11,27 +11,29 @@ enum class RunStage { BEFORE_MODEL_LOAD = 0, - AFTER_MODEL_LOAD = 1, + AFTER_NETWORK_CREATED = 1, - BEFORE_OUTSPEC_SET = 2, + AFTER_MODEL_LOAD = 2, + + BEFORE_OUTSPEC_SET = 3, //! using for dump static memory information svg file - AFTER_OUTSPEC_SET = 3, + AFTER_OUTSPEC_SET = 4, //! using for external c opr library - MODEL_RUNNING = 4, + MODEL_RUNNING = 5, //! using for output dumper - AFTER_RUNNING_WAIT = 5, + AFTER_RUNNING_WAIT = 6, //! using for external c opr library - AFTER_RUNNING_ITER = 6, + AFTER_RUNNING_ITER = 7, - AFTER_MODEL_RUNNING = 7, + AFTER_MODEL_RUNNING = 8, - GLOBAL_OPTIMIZATION = 8, + GLOBAL_OPTIMIZATION = 9, - UPDATE_IO = 9, + UPDATE_IO = 10, }; /*! * \brief: type of different model diff --git a/lite/load_and_run/src/models/model.h b/lite/load_and_run/src/models/model.h index 2e6f9b57732708ea3acd7eefbbdd45caa4ad2513..d1a017754440c3441d71c91ebdca9694f32e7991 100644 --- a/lite/load_and_run/src/models/model.h +++ b/lite/load_and_run/src/models/model.h @@ -24,6 +24,8 @@ public: virtual void set_shared_mem(bool state) = 0; + virtual void create_network(){}; + //! load model interface for load and run strategy virtual void load_model() = 0; diff --git a/lite/load_and_run/src/models/model_lite.cpp b/lite/load_and_run/src/models/model_lite.cpp index 71cba92188352837f634cca9b913536805d89d51..1f075a733e65dc0c57dbd004b0970c3e2af74c46 100644 --- a/lite/load_and_run/src/models/model_lite.cpp +++ b/lite/load_and_run/src/models/model_lite.cpp @@ -10,12 +10,12 @@ using namespace lar; ModelLite::ModelLite(const std::string& path) : model_path(path) { LITE_LOG("creat lite model use CPU as default comp node"); }; -void ModelLite::load_model() { + +void ModelLite::create_network() { m_network = std::make_shared(config, IO); - if (enable_layout_transform) { - LITE_LOG("enable layout transform while load model for lite"); - lite::Runtime::enable_global_layout_transform(m_network); - } +} + +void ModelLite::load_model() { if (share_model_mem) { //! WARNNING:maybe not right to share param memmory for this LITE_LOG("enable share model memory"); @@ -116,4 +116,4 @@ std::vector ModelLite::get_model_data() { LITE_THROW("unsupported interface: ModelLite::get_model_data() \n"); return out_data; -} \ No newline at end of file +} diff --git a/lite/load_and_run/src/models/model_lite.h b/lite/load_and_run/src/models/model_lite.h index 1df00b29c52bffe4951b2027558eae7eeb174596..521c9ff049bb361e69a180afa29664af44299c40 100644 --- a/lite/load_and_run/src/models/model_lite.h +++ b/lite/load_and_run/src/models/model_lite.h @@ -21,6 +21,9 @@ public: //! set to load from shared memory void set_shared_mem(bool state) override { share_model_mem = state; } + //! load model from dump file + void create_network() override; + //! load model from dump file void load_model() override; @@ -34,9 +37,6 @@ public: std::shared_ptr get_io_info() override; #endif - //! enable global layout transform - void set_layout_transform(bool state) { enable_layout_transform = state; } - //! get the network of lite model std::shared_ptr& get_lite_network() { return m_network; } @@ -61,7 +61,6 @@ public: private: bool share_model_mem = false; - bool enable_layout_transform = false; std::string model_path; DataParser parser; diff --git a/lite/load_and_run/src/options/fastrun_options.cpp b/lite/load_and_run/src/options/fastrun_options.cpp index ec5d0500216ff434dcd6d668e27022e68bd43839..8875a815dd74b8e4b060727da1fa1cbce075f46a 100644 --- a/lite/load_and_run/src/options/fastrun_options.cpp +++ b/lite/load_and_run/src/options/fastrun_options.cpp @@ -19,7 +19,7 @@ namespace lar { template <> void FastRunOption::config_model_internel( RuntimeParam& runtime_param, std::shared_ptr model) { - if (runtime_param.stage == RunStage::BEFORE_MODEL_LOAD) { + if (runtime_param.stage == RunStage::AFTER_NETWORK_CREATED) { //! set the algo policy before model load using Strategy = ModelLite::Strategy; uint32_t strategy = 0; @@ -44,23 +44,17 @@ void FastRunOption::config_model_internel( strategy; } auto lite_strategy = static_cast(strategy); - model->set_lite_strategy(lite_strategy); - } else if (runtime_param.stage == RunStage::AFTER_MODEL_LOAD) { - auto&& lite_network = model->get_lite_network(); - auto&& lite_strategy = model->get_lite_strategy(); //! set algo policy for model + auto&& lite_network = model->get_lite_network(); lite::Runtime::set_network_algo_policy( lite_network, lite_strategy, share_batch_size, batch_binary_equal); + } else if (runtime_param.stage == RunStage::AFTER_MODEL_LOAD) { if (!m_fast_run_cache.empty()) { if (!access(m_fast_run_cache.c_str(), F_OK)) { lite::set_persistent_cache(m_fast_run_cache); } else { lite::set_persistent_cache(m_fast_run_cache, true); } - //! TODO:this is from mdl model settings but not matched settings in - //! lite model - // if (!enable_full_run && !enable_fast_run) - // mgb::gopt::enable_opr_use_profiling_cache_inplace(vars); } } else if (runtime_param.stage == RunStage::AFTER_MODEL_RUNNING) { #if MGB_ENABLE_FASTRUN @@ -255,4 +249,4 @@ DEFINE_int32(fast_run_shared_batch_size, 0, "Set the batch size used during fast DEFINE_string(fast_run_algo_policy, "", "fast-run cache path."); REGIST_OPTION_CREATOR(fastrun, lar::FastRunOption::create_option); -REGIST_OPTION_VALIDATER(fastrun, lar::FastRunOption::set_valid); \ No newline at end of file +REGIST_OPTION_VALIDATER(fastrun, lar::FastRunOption::set_valid); diff --git a/lite/load_and_run/src/options/layout_trans_options.cpp b/lite/load_and_run/src/options/layout_trans_options.cpp index e933a9623cefe4411874c8c221970c838669f1c1..6c5d6d32ccb792aab11d62e2e5b65e1482737793 100644 --- a/lite/load_and_run/src/options/layout_trans_options.cpp +++ b/lite/load_and_run/src/options/layout_trans_options.cpp @@ -9,7 +9,7 @@ namespace lar { template <> void GoptLayoutOption::config_model_internel( RuntimeParam& runtime_param, std::shared_ptr model) { - if (runtime_param.stage == RunStage::BEFORE_MODEL_LOAD) { + if (runtime_param.stage == RunStage::AFTER_NETWORK_CREATED) { if (m_layout_transform) { LITE_LOG("using global layout transform optimization\n"); if (m_layout_transform_target == @@ -23,7 +23,9 @@ void GoptLayoutOption::config_model_internel( model->get_config().device_type = LiteDeviceType::LITE_CUDA; } #endif - model->set_layout_transform(true); + LITE_LOG("enable layout transform while load model for lite"); + auto&& lite_network = model->get_lite_network(); + lite::Runtime::enable_global_layout_transform(lite_network); } } else if (runtime_param.stage == RunStage::GLOBAL_OPTIMIZATION) { if (m_layout_transform) { @@ -266,4 +268,4 @@ DEFINE_int32( layout_transform_batch_size, -1, "the batch size of input for global layout transform optimization working on"); REGIST_OPTION_CREATOR(gopt_layout, lar::GoptLayoutOption::create_option); -REGIST_OPTION_VALIDATER(gopt_layout, lar::GoptLayoutOption::set_valid); \ No newline at end of file +REGIST_OPTION_VALIDATER(gopt_layout, lar::GoptLayoutOption::set_valid); diff --git a/lite/load_and_run/src/strategys/strategy_fitting.cpp b/lite/load_and_run/src/strategys/strategy_fitting.cpp index 630afc2de8125aad9a6aa00b00d050a2a96601c0..5f7754e66a2ad82ee382d9acaf76c0fe1927fef9 100644 --- a/lite/load_and_run/src/strategys/strategy_fitting.cpp +++ b/lite/load_and_run/src/strategys/strategy_fitting.cpp @@ -197,6 +197,10 @@ void OptionsTimeProfiler::profile_with_given_options( runtime_param.stage = RunStage::BEFORE_MODEL_LOAD; stage_config_model(); + runtime_param.stage = RunStage::AFTER_NETWORK_CREATED; + model->create_network(); + stage_config_model(); + model->load_model(); //! after load configure auto config_model_before_runing = [&]() { diff --git a/lite/load_and_run/src/strategys/strategy_normal.cpp b/lite/load_and_run/src/strategys/strategy_normal.cpp index 376b4959d2d7dd622b0294e47996d9a1812cf440..37bf037c0f97532986ecb3f53bdccb8136b7cd90 100644 --- a/lite/load_and_run/src/strategys/strategy_normal.cpp +++ b/lite/load_and_run/src/strategys/strategy_normal.cpp @@ -42,6 +42,10 @@ void NormalStrategy::run_subline() { m_runtime_param.stage = RunStage::BEFORE_MODEL_LOAD; stage_config_model(); + m_runtime_param.stage = RunStage::AFTER_NETWORK_CREATED; + model->create_network(); + stage_config_model(); + mgb::RealTimer timer; model->load_model(); mgb_log("load model: %.3fms\n", timer.get_msecs_reset()); diff --git a/lite/test/test_layout_options.cpp b/lite/test/test_layout_options.cpp index 1ef8402dd5073d92299ba87607fe5eff8e09d892..987a252d99756dce5be7d6fe85536b92478fce86 100644 --- a/lite/test/test_layout_options.cpp +++ b/lite/test/test_layout_options.cpp @@ -18,6 +18,7 @@ DECLARE_bool(enable_nchw32); DECLARE_bool(enable_nchw64); DECLARE_bool(enable_nhwcd4); DECLARE_bool(enable_nchw44_dot); +DECLARE_bool(fast_run); namespace { BOOL_OPTION_WRAP(enable_nchw4); BOOL_OPTION_WRAP(enable_chwn4); @@ -27,6 +28,7 @@ BOOL_OPTION_WRAP(enable_nchw32); BOOL_OPTION_WRAP(enable_nchw64); BOOL_OPTION_WRAP(enable_nhwcd4); BOOL_OPTION_WRAP(enable_nchw44_dot); +BOOL_OPTION_WRAP(fast_run); BOOL_OPTION_WRAP(lite); BOOL_OPTION_WRAP(cpu); @@ -60,6 +62,17 @@ TEST(TestLarLayout, X86_CPU_LITE) { TEST_BOOL_OPTION(enable_nchw32); TEST_BOOL_OPTION(enable_nchw88); } + +TEST(TestLarLayoutFastRun, CPU_LITE) { + DEFINE_WRAP(cpu); + DEFINE_WRAP(lite); + std::string model_path = "./shufflenet.mge"; + { + DEFINE_WRAP(enable_nchw44); + DEFINE_WRAP(fast_run); + run_NormalStrategy(model_path); + } +} #if LITE_WITH_CUDA TEST(TestLarLayout, CUDA) { DEFINE_WRAP(cuda); diff --git a/lite/test/test_options.h b/lite/test/test_options.h index e91bdf9dfe34a7c0db3ff23449c9c679012e5961..81f8be47facb743f433b09221d4863c107ab9360 100644 --- a/lite/test/test_options.h +++ b/lite/test/test_options.h @@ -25,9 +25,9 @@ void run_NormalStrategy(std::string model_path); #define DEFINE_WRAP(option) BoolOptionWrap_##option flags_##option; -#define TEST_BOOL_OPTION(option) \ - { \ - BoolOptionWrap_##option flags_##option; \ - run_NormalStrategy(model_path); \ +#define TEST_BOOL_OPTION(option) \ + { \ + DEFINE_WRAP(option); \ + run_NormalStrategy(model_path); \ } // vim: syntax=cpp.doxygen foldmethod=marker foldmarker=f{{{,f}}}