From d9991dccdd15366954f6219e4cc4c56586e338b5 Mon Sep 17 00:00:00 2001 From: wopeizl Date: Mon, 22 Apr 2019 17:57:00 +0800 Subject: [PATCH] =?UTF-8?q?add=20parallel=20build=20script=20to=20ci=20?= =?UTF-8?q?=E2=80=A6=20(#16901)?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit * add parallel build script to ci test=develop * 1. classify the test case as single card/two cards/multiple cards type 2. run test case according to the run type --- paddle/fluid/inference/api/CMakeLists.txt | 1 + .../fluid/inference/tests/book/CMakeLists.txt | 5 +- paddle/fluid/train/CMakeLists.txt | 2 + paddle/scripts/paddle_build.sh | 197 +++++++++++++++++- .../tests/book/high-level-api/CMakeLists.txt | 1 + .../fluid/tests/unittests/CMakeLists.txt | 10 + 6 files changed, 211 insertions(+), 5 deletions(-) diff --git a/paddle/fluid/inference/api/CMakeLists.txt b/paddle/fluid/inference/api/CMakeLists.txt index 882bb34683..a73f160dfc 100644 --- a/paddle/fluid/inference/api/CMakeLists.txt +++ b/paddle/fluid/inference/api/CMakeLists.txt @@ -56,6 +56,7 @@ if(WITH_TESTING) inference_base_test(test_api_impl SRCS api_impl_tester.cc DEPS ${inference_deps} ARGS --word2vec_dirname=${WORD2VEC_MODEL_DIR} --book_dirname=${PYTHON_TESTS_DIR}/book) set_tests_properties(test_api_impl PROPERTIES DEPENDS test_image_classification) + set_tests_properties(test_api_impl PROPERTIES LABELS "RUN_TYPE=EXCLUSIVE") endif() cc_test(test_analysis_predictor SRCS analysis_predictor_tester.cc DEPS analysis_predictor benchmark ${inference_deps} ARGS --dirname=${WORD2VEC_MODEL_DIR}) diff --git a/paddle/fluid/inference/tests/book/CMakeLists.txt b/paddle/fluid/inference/tests/book/CMakeLists.txt index 977155440d..aa8828c432 100644 --- a/paddle/fluid/inference/tests/book/CMakeLists.txt +++ b/paddle/fluid/inference/tests/book/CMakeLists.txt @@ -19,7 +19,9 @@ function(inference_test TARGET_NAME) DEPS paddle_fluid_origin ARGS --dirname=${PYTHON_TESTS_DIR}/book/${TARGET_NAME}${arg}.inference.model) set_tests_properties(test_inference_${TARGET_NAME}${arg} - PROPERTIES DEPENDS test_${TARGET_NAME}) + PROPERTIES DEPENDS test_${TARGET_NAME}) + set_tests_properties(test_inference_${TARGET_NAME}${arg} + PROPERTIES LABELS "RUN_TYPE=EXCLUSIVE") endforeach() endfunction(inference_test) @@ -45,3 +47,4 @@ cc_test(test_inference_nlp DEPS paddle_fluid_origin ARGS --model_path=${PADDLE_BINARY_DIR}/python/paddle/fluid/tests/book/recognize_digits_mlp.inference.model) +set_tests_properties(test_inference_nlp PROPERTIES LABELS "RUN_TYPE=EXCLUSIVE") diff --git a/paddle/fluid/train/CMakeLists.txt b/paddle/fluid/train/CMakeLists.txt index fae28fcb4c..0637ff4d73 100644 --- a/paddle/fluid/train/CMakeLists.txt +++ b/paddle/fluid/train/CMakeLists.txt @@ -20,6 +20,8 @@ function(train_test TARGET_NAME) ARGS --dirname=${PYTHON_TESTS_DIR}/book/${TARGET_NAME}${arg}.train.model/) set_tests_properties(test_train_${TARGET_NAME}${arg} PROPERTIES DEPENDS test_${TARGET_NAME}) + set_tests_properties(test_train_${TARGET_NAME}${arg} + PROPERTIES LABELS "RUN_TYPE=EXCLUSIVE") endforeach() endfunction(train_test) diff --git a/paddle/scripts/paddle_build.sh b/paddle/scripts/paddle_build.sh index 6f1b01b2d2..c896c2595f 100755 --- a/paddle/scripts/paddle_build.sh +++ b/paddle/scripts/paddle_build.sh @@ -561,6 +561,195 @@ function bind_test() { wait } +function parallel_test() { + mkdir -p ${PADDLE_ROOT}/build + cd ${PADDLE_ROOT}/build + if [ ${WITH_TESTING:-ON} == "ON" ] ; then + cat < ${CODE}" ; + EXIT_CODE=1; + fi + done + wait; # wait for all subshells to finish + + echo "EXIT_CODE => $EXIT_CODE" + if [[ "${EXIT_CODE}" != "0" ]]; then + exit "$EXIT_CODE" + fi + fi +} + +EXIT_CODE=0; +function caught_error() { + for job in `jobs -p`; do + # echo "PID => ${job}" + if ! wait ${job} ; then + echo "At least one test failed with exit code => $?" ; + EXIT_CODE=1; + fi + done +} + +function card_test() { + set -m + + # get the CUDA device count + CUDA_DEVICE_COUNT=$(nvidia-smi -L | wc -l) + + testcases=$1 + if (( $# > 1 )); then + cardnumber=$2 + if (( $cardnumber > $CUDA_DEVICE_COUNT )); then + cardnumber=$CUDA_DEVICE_COUNT + fi + else + cardnumber=$CUDA_DEVICE_COUNT + fi + + if [[ "$testcases" == "" ]]; then + return 0 + fi + + trap 'caught_error' CHLD + + NUM_PROC=$[CUDA_DEVICE_COUNT/$cardnumber] + for (( i = 0; i < $NUM_PROC; i++ )); do + # CUDA_VISIBLE_DEVICES http://acceleware.com/blog/cudavisibledevices-masking-gpus + # ctest -I https://cmake.org/cmake/help/v3.0/manual/ctest.1.html?highlight=ctest + cuda_list=() + for (( j = 0; j < cardnumber; j++ )); do + if [ $j -eq 0 ]; then + cuda_list=("$[i*cardnumber]") + else + cuda_list="$cuda_list,$[i*cardnumber+j]" + fi + done + # echo $cuda_list + if [ ${TESTING_DEBUG_MODE:-OFF} == "ON" ] ; then + if [[ $cardnumber == $CUDA_DEVICE_COUNT ]]; then + ctest -I $i,,$NUM_PROC -R "($testcases)" -V & + else + env CUDA_VISIBLE_DEVICES=$cuda_list ctest -I $i,,$NUM_PROC -R "($testcases)" -V & + fi + else + if [[ $cardnumber == $CUDA_DEVICE_COUNT ]]; then + ctest -I $i,,$NUM_PROC -R "($testcases)" --output-on-failure & + else + # echo "env CUDA_VISIBLE_DEVICES=$cuda_list ctest -I $i,,$NUM_PROC -R \"($testcases)\" --output-on-failure &" + env CUDA_VISIBLE_DEVICES=$cuda_list ctest -I $i,,$NUM_PROC -R "($testcases)" --output-on-failure & + fi + fi + done + + wait; # wait for all subshells to finish +} + +function aggresive_test() { + mkdir -p ${PADDLE_ROOT}/build + cd ${PADDLE_ROOT}/build + if [ ${WITH_TESTING:-ON} == "ON" ] ; then + cat <