From d714bf037c4dbc2f5626442728179257449755b8 Mon Sep 17 00:00:00 2001 From: guru4elephant <35550832+guru4elephant@users.noreply.github.com> Date: Wed, 17 Jul 2019 22:55:49 +0800 Subject: [PATCH] remove async executor and add data_feed.proto to the deps of train demo (#18659) * remove async executor and add data_feed.proto to the deps of train demo --- AUTHORS.md | 1 + cmake/inference_lib.cmake | 7 ++- paddle/fluid/framework/CMakeLists.txt | 15 +---- paddle/fluid/framework/data_feed.cc | 11 ++-- paddle/fluid/framework/data_feed.h | 4 +- paddle/fluid/framework/data_set.cc | 1 + paddle/fluid/inference/CMakeLists.txt | 2 +- paddle/fluid/pybind/CMakeLists.txt | 3 +- paddle/fluid/pybind/async_executor_py.cc | 72 ------------------------ paddle/fluid/pybind/async_executor_py.h | 28 --------- paddle/fluid/pybind/pybind.cc | 2 - paddle/fluid/train/demo/CMakeLists.txt | 2 +- 12 files changed, 16 insertions(+), 132 deletions(-) delete mode 100644 paddle/fluid/pybind/async_executor_py.cc delete mode 100644 paddle/fluid/pybind/async_executor_py.h diff --git a/AUTHORS.md b/AUTHORS.md index da91933f46..d99a613c85 100644 --- a/AUTHORS.md +++ b/AUTHORS.md @@ -14,6 +14,7 @@ | emailweixu | Wei Xu | | gangliao | Gang Liao | | gongweibao | Wei-Bao Gong | +| guru4elephant | Daxiang Dong | | Guo Sheng | Sheng Guo | | Haichao-Zhang | Hai-Chao Zhang | | hedaoyuan | Dao-Yuan He | diff --git a/cmake/inference_lib.cmake b/cmake/inference_lib.cmake index 885103a7e9..2a3962b92b 100644 --- a/cmake/inference_lib.cmake +++ b/cmake/inference_lib.cmake @@ -192,10 +192,11 @@ set(module "framework") if (NOT WIN32) set(framework_lib_deps framework_py_proto) endif (NOT WIN32) + copy(framework_lib DEPS ${framework_lib_deps} - SRCS ${src_dir}/${module}/*.h ${src_dir}/${module}/details/*.h ${PADDLE_BINARY_DIR}/paddle/fluid/framework/framework.pb.h - ${src_dir}/${module}/ir/*.h - DSTS ${dst_dir}/${module} ${dst_dir}/${module}/details ${dst_dir}/${module} ${dst_dir}/${module}/ir + SRCS ${src_dir}/${module}/*.h ${src_dir}/${module}/details/*.h ${PADDLE_BINARY_DIR}/paddle/fluid/framework/framework.pb.h ${PADDLE_BINARY_DIR}/paddle/fluid/framework/data_feed.pb.h ${src_dir}/${module}/ir/memory_optimize_pass/*.h + ${src_dir}/${module}/ir/*.h ${src_dir}/${module}/fleet/*.h + DSTS ${dst_dir}/${module} ${dst_dir}/${module}/details ${dst_dir}/${module} ${dst_dir}/${module} ${dst_dir}/${module}/ir/memory_optimize_pass ${dst_dir}/${module}/ir ${dst_dir}/${module}/fleet ) set(module "memory") diff --git a/paddle/fluid/framework/CMakeLists.txt b/paddle/fluid/framework/CMakeLists.txt index 65bbbd77a9..79c7bde040 100644 --- a/paddle/fluid/framework/CMakeLists.txt +++ b/paddle/fluid/framework/CMakeLists.txt @@ -28,7 +28,6 @@ add_subdirectory(io) #ddim lib proto_library(framework_proto SRCS framework.proto) proto_library(data_feed_proto SRCS data_feed.proto) -proto_library(async_executor_proto SRCS data_feed.proto) proto_library(trainer_desc_proto SRCS trainer_desc.proto DEPS framework_proto data_feed_proto) @@ -190,7 +189,7 @@ else() pull_dense_worker.cc section_worker.cc device_worker_factory.cc data_set.cc DEPS op_registry device_context scope framework_proto data_feed_proto trainer_desc_proto glog lod_rank_table fs shell fleet_wrapper lodtensor_printer feed_fetch_method - graph_to_program_pass variable_helper ${NGRAPH_EXE_DEPS} timer data_feed_proto) + graph_to_program_pass variable_helper ${NGRAPH_EXE_DEPS} timer) cc_test(test_naive_executor SRCS naive_executor_test.cc DEPS naive_executor elementwise_add_op) endif() @@ -201,18 +200,6 @@ cc_library(parallel_executor SRCS parallel_executor.cc DEPS graph build_strategy fast_threaded_ssa_graph_executor variable_helper) -cc_library(async_executor SRCS async_executor.cc data_feed.cc data_feed_factory.cc - executor_thread_worker.cc multi_trainer.cc dist_multi_trainer.cc pipeline_trainer.cc - trainer_factory.cc trainer.cc device_worker.cc hogwild_worker.cc - downpour_worker.cc pull_dense_worker.cc section_worker.cc - device_worker_factory.cc data_set.cc dataset_factory.cc - DEPS op_registry device_context scope framework_proto - trainer_desc_proto glog lod_rank_table fleet_wrapper lodtensor_printer - feed_fetch_method graph_to_program_pass data_feed_proto - variable_helper timer fs shell) - - -cc_test(data_feed_test SRCS data_feed_test.cc DEPS async_executor) cc_library(prune SRCS prune.cc DEPS framework_proto) cc_test(prune_test SRCS prune_test.cc DEPS op_info prune recurrent_op device_context) cc_test(var_type_inference_test SRCS var_type_inference_test.cc DEPS op_registry diff --git a/paddle/fluid/framework/data_feed.cc b/paddle/fluid/framework/data_feed.cc index 697a383983..aa13e7f8e7 100644 --- a/paddle/fluid/framework/data_feed.cc +++ b/paddle/fluid/framework/data_feed.cc @@ -101,8 +101,7 @@ template void PrivateQueueDataFeed::SetQueueSize(int queue_size) { PADDLE_ENFORCE(queue_size > 0, "Illegal queue size: %d.", queue_size); queue_size_ = queue_size; - queue_ = std::unique_ptr>( - new paddle::operators::reader::BlockingQueue(queue_size_)); + queue_ = paddle::framework::MakeChannel(); } template @@ -125,7 +124,7 @@ void PrivateQueueDataFeed::ReadThread() { __fsetlocking(&*fp_, FSETLOCKING_BYCALLER); T instance; while (ParseOneInstanceFromPipe(&instance)) { - queue_->Send(instance); + queue_->Put(instance); } } queue_->Close(); @@ -137,10 +136,10 @@ int PrivateQueueDataFeed::Next() { #ifdef _LINUX CheckStart(); int index = 0; - T instance; T ins_vec; while (index < default_batch_size_) { - if (!queue_->Receive(&instance)) { + T instance; + if (!queue_->Get(instance)) { break; } AddInstanceToInsVec(&ins_vec, instance, index++); @@ -345,7 +344,7 @@ void MultiSlotDataFeed::ReadThread() { int ins_num = 0; while (ParseOneInstanceFromPipe(&instance)) { ins_num++; - queue_->Send(instance); + queue_->Put(instance); } VLOG(3) << "filename: " << filename << " inst num: " << ins_num; } diff --git a/paddle/fluid/framework/data_feed.h b/paddle/fluid/framework/data_feed.h index 93f14dd74f..d84e9df679 100644 --- a/paddle/fluid/framework/data_feed.h +++ b/paddle/fluid/framework/data_feed.h @@ -33,11 +33,9 @@ limitations under the License. */ #include "paddle/fluid/framework/blocking_queue.h" #include "paddle/fluid/framework/channel.h" #include "paddle/fluid/framework/data_feed.pb.h" -#include "paddle/fluid/framework/fleet/fleet_wrapper.h" #include "paddle/fluid/framework/lod_tensor.h" #include "paddle/fluid/framework/reader.h" #include "paddle/fluid/framework/variable.h" -#include "paddle/fluid/operators/reader/blocking_queue.h" #include "paddle/fluid/string/string_helper.h" namespace paddle { @@ -198,7 +196,7 @@ class PrivateQueueDataFeed : public DataFeed { size_t queue_size_; string::LineFileReader reader_; // The queue for store parsed data - std::unique_ptr> queue_; + std::shared_ptr> queue_; }; template diff --git a/paddle/fluid/framework/data_set.cc b/paddle/fluid/framework/data_set.cc index 119794e592..e03d948ea3 100644 --- a/paddle/fluid/framework/data_set.cc +++ b/paddle/fluid/framework/data_set.cc @@ -18,6 +18,7 @@ #include "google/protobuf/message.h" #include "google/protobuf/text_format.h" #include "paddle/fluid/framework/data_feed_factory.h" +#include "paddle/fluid/framework/fleet/fleet_wrapper.h" #include "paddle/fluid/framework/io/fs.h" #include "paddle/fluid/platform/timer.h" diff --git a/paddle/fluid/inference/CMakeLists.txt b/paddle/fluid/inference/CMakeLists.txt index 44eaf90371..83d91afa25 100644 --- a/paddle/fluid/inference/CMakeLists.txt +++ b/paddle/fluid/inference/CMakeLists.txt @@ -2,7 +2,7 @@ if(WITH_TESTING) include(tests/test.cmake) # some generic cmake funtion for inference endif() -set(FLUID_CORE_MODULES proto_desc memory lod_tensor executor) +set(FLUID_CORE_MODULES proto_desc memory lod_tensor executor data_feed_proto) # TODO(panyx0718): Should this be called paddle_fluid_inference_api_internal? cc_library(paddle_fluid_api diff --git a/paddle/fluid/pybind/CMakeLists.txt b/paddle/fluid/pybind/CMakeLists.txt index eeee507110..8ee03c7982 100644 --- a/paddle/fluid/pybind/CMakeLists.txt +++ b/paddle/fluid/pybind/CMakeLists.txt @@ -1,4 +1,4 @@ -set(PYBIND_DEPS pybind python proto_desc memory executor async_executor fleet_wrapper nccl_wrapper prune +set(PYBIND_DEPS pybind python proto_desc memory executor fleet_wrapper nccl_wrapper prune feed_fetch_method pass_builder parallel_executor profiler layer scope_pool tracer analysis_predictor imperative_profiler nccl_context) @@ -17,7 +17,6 @@ set(PYBIND_SRCS const_value.cc recordio.cc reader_py.cc - async_executor_py.cc fleet_wrapper_py.cc nccl_wrapper_py.cc data_set_py.cc diff --git a/paddle/fluid/pybind/async_executor_py.cc b/paddle/fluid/pybind/async_executor_py.cc deleted file mode 100644 index 009d13c243..0000000000 --- a/paddle/fluid/pybind/async_executor_py.cc +++ /dev/null @@ -1,72 +0,0 @@ -/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserved. - -Licensed under the Apache License, Version 2.0 (the "License"); -you may not use this file except in compliance with the License. -You may obtain a copy of the License at - -http://www.apache.org/licenses/LICENSE-2.0 - -Unless required by applicable law or agreed to in writing, software -distributed under the License is distributed on an "AS IS" BASIS, -WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -See the License for the specific language governing permissions and -limitations under the License. */ -#include - -// To avoid conflicting definition in gcc-4.8.2 headers and pyconfig.h (2.7.3) -#ifdef _POSIX_C_SOURCE -#undef _POSIX_C_SOURCE -#endif - -#ifdef _XOPEN_SOURCE -#undef _XOPEN_SOURCE -#endif -#include -#include -#include - -#include "google/protobuf/io/zero_copy_stream_impl.h" -#include "google/protobuf/text_format.h" -#include "paddle/fluid/framework/async_executor.h" -#include "paddle/fluid/framework/data_feed.h" -#include "paddle/fluid/framework/data_feed.pb.h" -#include "paddle/fluid/framework/scope.h" -#include "paddle/fluid/inference/io.h" -#include "paddle/fluid/platform/place.h" -#include "paddle/fluid/platform/variant.h" -#include "paddle/fluid/pybind/async_executor_py.h" - -namespace py = pybind11; -namespace pd = paddle::framework; - -namespace paddle { -namespace pybind { -using set_name_func = void (pd::DataFeedDesc::*)(const std::string&); -#ifdef PADDLE_WITH_PSLIB -void BindAsyncExecutor(py::module* m) { - py::class_(*m, "AsyncExecutor") - .def(py::init([](framework::Scope* scope, const platform::Place& place) { - return std::unique_ptr( - new framework::AsyncExecutor(scope, place)); - })) - .def("run_from_files", &framework::AsyncExecutor::RunFromFile) - .def("init_server", &framework::AsyncExecutor::InitServer) - .def("init_worker", &framework::AsyncExecutor::InitWorker) - .def("start_server", &framework::AsyncExecutor::StartServer) - .def("stop_server", &framework::AsyncExecutor::StopServer) - .def("gather_servers", &framework::AsyncExecutor::GatherServers) - .def("init_model", &framework::AsyncExecutor::InitModel) - .def("save_model", &framework::AsyncExecutor::SaveModel); -} // end BindAsyncExecutor -#else -void BindAsyncExecutor(py::module* m) { - py::class_(*m, "AsyncExecutor") - .def(py::init([](framework::Scope* scope, const platform::Place& place) { - return std::unique_ptr( - new framework::AsyncExecutor(scope, place)); - })) - .def("run_from_files", &framework::AsyncExecutor::RunFromFile); -} // end BindAsyncExecutor -#endif -} // end namespace pybind -} // end namespace paddle diff --git a/paddle/fluid/pybind/async_executor_py.h b/paddle/fluid/pybind/async_executor_py.h deleted file mode 100644 index a99d6e0421..0000000000 --- a/paddle/fluid/pybind/async_executor_py.h +++ /dev/null @@ -1,28 +0,0 @@ -// Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved. -// -// Licensed under the Apache License, Version 2.0 (the "License"); -// you may not use this file except in compliance with the License. -// You may obtain a copy of the License at -// -// http://www.apache.org/licenses/LICENSE-2.0 -// -// Unless required by applicable law or agreed to in writing, software -// distributed under the License is distributed on an "AS IS" BASIS, -// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -// See the License for the specific language governing permissions and -// limitations under the License. - -#pragma once - -#include "pybind11/pybind11.h" -#include "pybind11/stl.h" - -namespace py = pybind11; - -namespace paddle { -namespace pybind { - -void BindAsyncExecutor(py::module* m); - -} // namespace pybind -} // namespace paddle diff --git a/paddle/fluid/pybind/pybind.cc b/paddle/fluid/pybind/pybind.cc index f0dcf91921..bd63517a8a 100644 --- a/paddle/fluid/pybind/pybind.cc +++ b/paddle/fluid/pybind/pybind.cc @@ -51,7 +51,6 @@ limitations under the License. */ #include "paddle/fluid/platform/init.h" #include "paddle/fluid/platform/place.h" #include "paddle/fluid/platform/profiler.h" -#include "paddle/fluid/pybind/async_executor_py.h" #include "paddle/fluid/pybind/const_value.h" #include "paddle/fluid/pybind/data_set_py.h" #include "paddle/fluid/pybind/exception.h" @@ -1609,7 +1608,6 @@ All parameter, weight, gradient are variables in Paddle. }); BindRecordIOWriter(&m); - BindAsyncExecutor(&m); BindFleetWrapper(&m); #ifndef _WIN32 BindNCCLWrapper(&m); diff --git a/paddle/fluid/train/demo/CMakeLists.txt b/paddle/fluid/train/demo/CMakeLists.txt index af033fa740..4e87f330e0 100644 --- a/paddle/fluid/train/demo/CMakeLists.txt +++ b/paddle/fluid/train/demo/CMakeLists.txt @@ -70,7 +70,7 @@ endif(APPLE) target_link_libraries(demo_trainer ${MACOS_LD_FLAGS} ${ARCHIVE_START} - ${PADDLE_LIB}/paddle/fluid/inference/libpaddle_fluid.a + ${PADDLE_LIB}/paddle/fluid/inference/libpaddle_fluid.so ${ARCHIVE_END} ${MATH_LIB} ${MKLDNN_LIB} -- GitLab