#!/bin/bash function usage() { echo "$0" echo -e "\t -m vm config file" echo -e "\t -t task file" echo -e "\t -b branch" echo -e "\t -l log dir" echo -e "\t -e enterprise edition" echo -e "\t -o default timeout value" echo -e "\t -w log web server" echo -e "\t -h help" } ent=0 while getopts "m:t:b:l:o:w:eh" opt; do case $opt in m) config_file=$OPTARG ;; t) t_file=$OPTARG ;; b) branch=$OPTARG ;; l) log_dir=$OPTARG ;; e) ent=1 ;; o) timeout_param="-o $OPTARG" ;; w) web_server=$OPTARG ;; h) usage exit 0 ;; \?) echo "Invalid option: -$OPTARG" usage exit 0 ;; esac done #config_file=$1 if [ -z $config_file ]; then usage exit 1 fi if [ ! -f $config_file ]; then echo "$config_file not found" usage exit 1 fi #t_file=$2 if [ -z $t_file ]; then usage exit 1 fi if [ ! -f $t_file ]; then echo "$t_file not found" usage exit 1 fi date_tag=`date +%Y%m%d-%H%M%S` test_log_dir=${branch}_${date_tag} if [ -z $log_dir ]; then log_dir="log/${test_log_dir}" else log_dir="$log_dir/${test_log_dir}" fi hosts=() usernames=() passwords=() workdirs=() threads=() i=0 while [ 1 ]; do host=`jq .[$i].host $config_file` if [ "$host" = "null" ]; then break fi username=`jq .[$i].username $config_file` if [ "$username" = "null" ]; then break fi password=`jq .[$i].password $config_file` if [ "$password" = "null" ]; then password="" fi workdir=`jq .[$i].workdir $config_file` if [ "$workdir" = "null" ]; then break fi thread=`jq .[$i].thread $config_file` if [ "$thread" = "null" ]; then break fi hosts[i]=`echo $host|sed 's/\"$//'|sed 's/^\"//'` usernames[i]=`echo $username|sed 's/\"$//'|sed 's/^\"//'` passwords[i]=`echo $password|sed 's/\"$//'|sed 's/^\"//'` workdirs[i]=`echo $workdir|sed 's/\"$//'|sed 's/^\"//'` threads[i]=$thread i=$(( i + 1 )) done function prepare_cases() { cat $t_file >>$task_file local i=0 while [ $i -lt $1 ]; do echo "%%FINISHED%%" >>$task_file i=$(( i + 1 )) done } function clean_tmp() { # clean tmp dir local index=$1 local ssh_script="sshpass -p ${passwords[index]} ssh -o StrictHostKeyChecking=no ${usernames[index]}@${hosts[index]}" if [ -z ${passwords[index]} ]; then ssh_script="ssh -o StrictHostKeyChecking=no ${usernames[index]}@${hosts[index]}" fi local cmd="${ssh_script} rm -rf ${workdirs[index]}/tmp" ${cmd} } function run_thread() { local index=$1 local thread_no=$2 local runcase_script="sshpass -p ${passwords[index]} ssh -o StrictHostKeyChecking=no ${usernames[index]}@${hosts[index]}" if [ -z ${passwords[index]} ]; then runcase_script="ssh -o StrictHostKeyChecking=no ${usernames[index]}@${hosts[index]}" fi local count=0 local script="${workdirs[index]}/TDengine/tests/parallel_test/run_container.sh" if [ $ent -ne 0 ]; then local script="${workdirs[index]}/TDinternal/community/tests/parallel_test/run_container.sh -e" fi local cmd="${runcase_script} ${script}" # script="echo" while [ 1 ]; do local line=`flock -x $lock_file -c "head -n1 $task_file;sed -i \"1d\" $task_file"` if [ "x$line" = "x%%FINISHED%%" ]; then # echo "$index . $thread_no EXIT" break fi if [ -z "$line" ]; then continue fi echo "$line"|grep -q "^#" if [ $? -eq 0 ]; then continue fi local case_redo_time=`echo "$line"|cut -d, -f2` if [ -z "$case_redo_time" ]; then case_redo_time=${DEFAULT_RETRY_TIME:-2} fi local case_build_san=`echo "$line"|cut -d, -f3` if [ "${case_build_san}" == "y" ]; then case_build_san="y" elif [[ "${case_build_san}" == "n" ]] || [[ "${case_build_san}" == "" ]]; then case_build_san="n" else usage exit 1 fi local exec_dir=`echo "$line"|cut -d, -f4` local case_cmd=`echo "$line"|cut -d, -f5` local case_file="" echo "$case_cmd"|grep -q "\.sh" if [ $? -eq 0 ]; then case_file=`echo "$case_cmd"|grep -o ".*\.sh"|awk '{print $NF}'` fi echo "$case_cmd"|grep -q "^python3" if [ $? -eq 0 ]; then case_file=`echo "$case_cmd"|grep -o ".*\.py"|awk '{print $NF}'` fi echo "$case_cmd"|grep -q "^./pytest.sh" if [ $? -eq 0 ]; then case_file=`echo "$case_cmd"|grep -o ".*\.py"|awk '{print $NF}'` fi echo "$case_cmd"|grep -q "\.sim" if [ $? -eq 0 ]; then case_file=`echo "$case_cmd"|grep -o ".*\.sim"|awk '{print $NF}'` fi if [ -z "$case_file" ]; then case_file=`echo "$case_cmd"|awk '{print $NF}'` fi if [ -z "$case_file" ]; then continue fi case_file="$exec_dir/${case_file}.${index}.${thread_no}.${count}" count=$(( count + 1 )) local case_path=`dirname "$case_file"` if [ ! -z "$case_path" ]; then mkdir -p $log_dir/$case_path fi cmd="${runcase_script} ${script} -w ${workdirs[index]} -c \"${case_cmd}\" -t ${thread_no} -d ${exec_dir} -s ${case_build_san} ${timeout_param}" # echo "$thread_no $count $cmd" local ret=0 local redo_count=1 local case_log_file=$log_dir/${case_file}.txt start_time=`date +%s` local case_index=`flock -x $lock_file -c "sh -c \"echo \\\$(( \\\$( cat $index_file ) + 1 )) | tee $index_file\""` case_index=`printf "%5d" $case_index` local case_info=`echo "$line"|cut -d, -f 3,4,5` while [ ${redo_count} -lt 6 ]; do if [ -f $case_log_file ]; then cp $case_log_file $log_dir/$case_file.${redo_count}.redotxt fi echo "${hosts[index]}-${thread_no} order:${count}, redo:${redo_count} task:${line}" >$case_log_file local current_time=`date "+%Y-%m-%d %H:%M:%S"` echo -e "$case_index \e[33m START >>>>> \e[0m ${case_info} \e[33m[$current_time]\e[0m" echo "$current_time" >>$case_log_file local real_start_time=`date +%s` # $cmd 2>&1 | tee -a $case_log_file # ret=${PIPESTATUS[0]} $cmd >>$case_log_file 2>&1 ret=$? local real_end_time=`date +%s` local time_elapsed=$(( real_end_time - real_start_time )) echo "execute time: ${time_elapsed}s" >>$case_log_file current_time=`date "+%Y-%m-%d %H:%M:%S"` echo "${hosts[index]} $current_time exit code:${ret}" >>$case_log_file if [ $ret -eq 0 ]; then break fi redo=0 grep -q "wait too long for taosd start" $case_log_file if [ $? -eq 0 ]; then redo=1 fi grep -q "kex_exchange_identification: Connection closed by remote host" $case_log_file if [ $? -eq 0 ]; then redo=1 fi grep -q "ssh_exchange_identification: Connection closed by remote host" $case_log_file if [ $? -eq 0 ]; then redo=1 fi grep -q "kex_exchange_identification: read: Connection reset by peer" $case_log_file if [ $? -eq 0 ]; then redo=1 fi grep -q "Database not ready" $case_log_file if [ $? -eq 0 ]; then redo=1 fi grep -q "Unable to establish connection" $case_log_file if [ $? -eq 0 ]; then redo=1 fi if [ $redo_count -lt $case_redo_time ]; then redo=1 fi if [ $redo -eq 0 ]; then break fi redo_count=$(( redo_count + 1 )) done end_time=`date +%s` echo >>$case_log_file total_time=$(( end_time - start_time )) echo "${hosts[index]} total time: ${total_time}s" >>$case_log_file # echo "$thread_no ${line} DONE" if [ $ret -eq 0 ]; then echo -e "$case_index \e[34m DONE <<<<< \e[0m ${case_info} \e[34m[${total_time}s]\e[0m \e[32m success\e[0m" flock -x $lock_file -c "echo \"${case_info}|success|${total_time}\" >>${success_case_file}" else if [ ! -z ${web_server} ]; then flock -x $lock_file -c "echo -e \"${hosts[index]} ret:${ret} ${line}\n ${web_server}/$test_log_dir/${case_file}.txt\" >>${failed_case_file}" else flock -x $lock_file -c "echo -e \"${hosts[index]} ret:${ret} ${line}\n log file: ${case_log_file}\" >>${failed_case_file}" fi mkdir -p $log_dir/${case_file}.coredump local remote_coredump_dir="${workdirs[index]}/tmp/thread_volume/$thread_no/coredump" local scpcmd="sshpass -p ${passwords[index]} scp -o StrictHostKeyChecking=no -r ${usernames[index]}@${hosts[index]}" if [ -z ${passwords[index]} ]; then scpcmd="scp -o StrictHostKeyChecking=no -r ${usernames[index]}@${hosts[index]}" fi cmd="$scpcmd:${remote_coredump_dir}/* $log_dir/${case_file}.coredump/" $cmd # 2>/dev/null local corefile=`ls $log_dir/${case_file}.coredump/` echo -e "$case_index \e[34m DONE <<<<< \e[0m ${case_info} \e[34m[${total_time}s]\e[0m \e[31m failed\e[0m" echo "=========================log============================" cat $case_log_file echo "=====================================================" echo -e "\e[34m log file: $case_log_file \e[0m" if [ ! -z "${web_server}" ]; then echo "${web_server}/$test_log_dir/${case_file}.txt" fi if [ ! -z "$corefile" ]; then echo -e "\e[34m corefiles: $corefile \e[0m" local build_dir=$log_dir/build_${hosts[index]} local remote_build_dir="${workdirs[index]}/TDengine/debug/build" if [ $ent -ne 0 ]; then remote_build_dir="${workdirs[index]}/TDinternal/debug/build" fi mkdir $build_dir 2>/dev/null if [ $? -eq 0 ]; then # scp build binary cmd="$scpcmd:${remote_build_dir}/* ${build_dir}/" echo "$cmd" $cmd >/dev/null fi fi # get remote sim dir local remote_sim_dir="${workdirs[index]}/tmp/thread_volume/$thread_no" local tarcmd="sshpass -p ${passwords[index]} ssh -o StrictHostKeyChecking=no -r ${usernames[index]}@${hosts[index]}" if [ -z ${passwords[index]} ]; then tarcmd="ssh -o StrictHostKeyChecking=no ${usernames[index]}@${hosts[index]}" fi cmd="$tarcmd sh -c \"cd $remote_sim_dir; tar -czf sim.tar.gz sim\"" $cmd local remote_sim_tar="${workdirs[index]}/tmp/thread_volume/$thread_no/sim.tar.gz" scpcmd="sshpass -p ${passwords[index]} scp -o StrictHostKeyChecking=no -r ${usernames[index]}@${hosts[index]}" if [ -z ${passwords[index]} ]; then scpcmd="scp -o StrictHostKeyChecking=no -r ${usernames[index]}@${hosts[index]}" fi cmd="$scpcmd:${remote_sim_tar} $log_dir/${case_file}.sim.tar.gz" $cmd # backup source code (disabled) source_tar_dir=$log_dir/TDengine_${hosts[index]} source_tar_file=TDengine.tar.gz if [ $ent -ne 0 ]; then source_tar_dir=$log_dir/TDinternal_${hosts[index]} source_tar_file=TDinternal.tar.gz fi mkdir $source_tar_dir 2>/dev/null if [ $? -eq 0 ]; then cmd="$scpcmd:${workdirs[index]}/$source_tar_file $source_tar_dir" # echo "$cmd" # $cmd fi fi done } # echo "hosts: ${hosts[@]}" # echo "usernames: ${usernames[@]}" # echo "passwords: ${passwords[@]}" # echo "workdirs: ${workdirs[@]}" # echo "threads: ${threads[@]}" # TODO: check host accessibility i=0 while [ $i -lt ${#hosts[*]} ]; do clean_tmp $i & i=$(( i + 1 )) done wait mkdir -p $log_dir rm -rf $log_dir/* task_file=$log_dir/$$.task lock_file=$log_dir/$$.lock index_file=$log_dir/case_index.txt stat_file=$log_dir/stat.txt failed_case_file=$log_dir/failed.txt success_case_file=$log_dir/success.txt echo "0" >$index_file i=0 j=0 while [ $i -lt ${#hosts[*]} ]; do j=$(( j + threads[i] )) i=$(( i + 1 )) done prepare_cases $j i=0 while [ $i -lt ${#hosts[*]} ]; do j=0 while [ $j -lt ${threads[i]} ]; do run_thread $i $j & j=$(( j + 1 )) done i=$(( i + 1 )) done wait rm -f $lock_file rm -f $task_file # docker ps -a|grep -v CONTAINER|awk '{print $1}'|xargs docker rm -f echo "=====================================================================" echo "log dir: $log_dir" total_cases=`cat $index_file` failed_cases=0 if [ -f $failed_case_file ]; then if [ ! -z "$web_server" ]; then failed_cases=`grep -v "$web_server" $failed_case_file|wc -l` else failed_cases=`grep -v "log file:" $failed_case_file|wc -l` fi fi success_cases=$(( total_cases - failed_cases )) echo "Total Cases: $total_cases" >$stat_file echo "Successful: $success_cases" >>$stat_file echo "Failed: $failed_cases" >>$stat_file cat $stat_file RET=0 i=1 if [ -f "${failed_case_file}" ]; then echo "=====================================================" while read line; do if [ ! -z "${web_server}" ]; then echo "$line"|grep -q "${web_server}" if [ $? -eq 0 ]; then echo " $line" continue fi else echo "$line"|grep -q "log file:" if [ $? -eq 0 ]; then echo " $line" continue fi fi line=`echo "$line"|cut -d, -f 3,4,5` echo -e "$i. $line \e[31m failed\e[0m" >&2 i=$(( i + 1 )) done <${failed_case_file} RET=1 fi echo "${log_dir}" >&2 date exit $RET