prepare.sh 13.2 KB
Newer Older
S
stephon 已提交
1 2 3
#!/bin/bash
FILENAME=$1

G
fix  
gaotingquan 已提交
4
# MODE be one of ['lite_train_lite_infer' 'lite_train_whole_infer' 'whole_train_whole_infer',
H
HydrogenSulfate 已提交
5
#                 'whole_infer', 'cpp_infer', 'serving_infer',  'lite_infer']
S
stephon 已提交
6 7 8 9 10 11 12 13

MODE=$2

dataline=$(cat ${FILENAME})
# parser params
IFS=$'\n'
lines=(${dataline})

H
debug  
HydrogenSulfate 已提交
14
function func_parser_key() {
S
stephon 已提交
15 16 17 18 19 20 21
    strs=$1
    IFS=":"
    array=(${strs})
    tmp=${array[0]}
    echo ${tmp}
}

H
debug  
HydrogenSulfate 已提交
22
function func_parser_value() {
S
stephon 已提交
23 24 25 26 27 28
    strs=$1
    IFS=":"
    array=(${strs})
    if [ ${#array[*]} = 2 ]; then
        echo ${array[1]}
    else
H
debug  
HydrogenSulfate 已提交
29 30
        IFS="|"
        tmp="${array[1]}:${array[2]}"
S
stephon 已提交
31 32 33 34
        echo ${tmp}
    fi
}

H
debug  
HydrogenSulfate 已提交
35
function func_get_url_file_name() {
D
dongshuilong 已提交
36 37 38
    strs=$1
    IFS="/"
    array=(${strs})
H
debug  
HydrogenSulfate 已提交
39
    tmp=${array[${#array[@]} - 1]}
D
dongshuilong 已提交
40 41 42 43 44
    echo ${tmp}
}

model_name=$(func_parser_value "${lines[1]}")

H
HydrogenSulfate 已提交
45
if [[ ${MODE} = "cpp_infer" ]]; then
H
debug  
HydrogenSulfate 已提交
46
    if [ -d "./deploy/cpp/opencv-3.4.7/opencv3/" ] && [ $(md5sum ./deploy/cpp/opencv-3.4.7.tar.gz | awk -F ' ' '{print $1}') = "faa2b5950f8bee3f03118e600c74746a" ]; then
H
debug  
HydrogenSulfate 已提交
47 48 49 50 51 52 53 54 55 56 57 58 59 60 61
        echo "################### build opencv skipped ###################"
    else
        echo "################### build opencv ###################"
        rm -rf ./deploy/cpp/opencv-3.4.7.tar.gz ./deploy/cpp/opencv-3.4.7/
        pushd ./deploy/cpp/
        wget -nc https://paddleocr.bj.bcebos.com/dygraph_v2.0/test/opencv-3.4.7.tar.gz
        tar -xf opencv-3.4.7.tar.gz

        cd opencv-3.4.7/
        install_path=$(pwd)/opencv3
        rm -rf build
        mkdir build
        cd build

        cmake .. \
H
debug  
HydrogenSulfate 已提交
62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77
        -DCMAKE_INSTALL_PREFIX=${install_path} \
        -DCMAKE_BUILD_TYPE=Release \
        -DBUILD_SHARED_LIBS=OFF \
        -DWITH_IPP=OFF \
        -DBUILD_IPP_IW=OFF \
        -DWITH_LAPACK=OFF \
        -DWITH_EIGEN=OFF \
        -DCMAKE_INSTALL_LIBDIR=lib64 \
        -DWITH_ZLIB=ON \
        -DBUILD_ZLIB=ON \
        -DWITH_JPEG=ON \
        -DBUILD_JPEG=ON \
        -DWITH_PNG=ON \
        -DBUILD_PNG=ON \
        -DWITH_TIFF=ON \
        -DBUILD_TIFF=ON
H
debug  
HydrogenSulfate 已提交
78 79 80 81 82 83 84

        make -j
        make install
        cd ../../
        popd
        echo "################### build opencv finished ###################"
    fi
85 86
    if [[ ! -d "./deploy/cpp/paddle_inference/" ]]; then
        pushd ./deploy/cpp/
87
        PADDLEInfer=$3
88
        if [ "" = "$PADDLEInfer" ]; then
89
            wget -nc https://paddle-inference-lib.bj.bcebos.com/2.2.2/cxx_c/Linux/GPU/x86-64_gcc8.2_avx_mkl_cuda10.1_cudnn7.6.5_trt6.0.1.5/paddle_inference.tgz --no-check-certificate
90
            tar xf paddle_inference.tgz
91 92
        else
            wget -nc ${PADDLEInfer} --no-check-certificate
93 94 95
            tar_name=$(func_get_url_file_name "$PADDLEInfer")
            tar xf ${tar_name}
            if [ ! -d "paddle_inference" ]; then
96
                ln -s paddle_inference_install_dir paddle_inference
97
            fi
98
        fi
99 100
        popd
    fi
H
debug  
HydrogenSulfate 已提交
101 102 103 104 105 106 107 108 109
    if [[ $FILENAME == *infer_cpp_linux_gpu_cpu.txt ]]; then
        cpp_type=$(func_parser_value "${lines[2]}")
        cls_inference_model_dir=$(func_parser_value "${lines[3]}")
        det_inference_model_dir=$(func_parser_value "${lines[4]}")
        cls_inference_url=$(func_parser_value "${lines[5]}")
        det_inference_url=$(func_parser_value "${lines[6]}")

        if [[ $cpp_type == "cls" ]]; then
            eval "wget -nc $cls_inference_url"
H
HydrogenSulfate 已提交
110 111 112
            tar_name=$(func_get_url_file_name "$cls_inference_url")
            model_dir=${tar_name%.*}
            eval "tar xf ${tar_name}"
H
debug  
HydrogenSulfate 已提交
113

H
debug  
HydrogenSulfate 已提交
114 115 116 117 118 119 120 121
            # move '_int8' suffix in pact models
            if [[ ${tar_name} =~ "pact_infer" ]]; then
                cd ${cls_inference_model_dir}
                mv inference_int8.pdiparams inference.pdiparams
                mv inference_int8.pdmodel inference.pdmodel
                cd ..
            fi

H
debug  
HydrogenSulfate 已提交
122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137
            cd dataset
            rm -rf ILSVRC2012
            wget -nc https://paddle-imagenet-models-name.bj.bcebos.com/data/whole_chain/whole_chain_infer.tar
            tar xf whole_chain_infer.tar
            ln -s whole_chain_infer ILSVRC2012
            cd ..
        elif [[ $cpp_type == "shitu" ]]; then
            eval "wget -nc $cls_inference_url"
            tar_name=$(func_get_url_file_name "$cls_inference_url")
            model_dir=${tar_name%.*}
            eval "tar xf ${tar_name}"

            eval "wget -nc $det_inference_url"
            tar_name=$(func_get_url_file_name "$det_inference_url")
            model_dir=${tar_name%.*}
            eval "tar xf ${tar_name}"
H
debug  
HydrogenSulfate 已提交
138

H
debug  
HydrogenSulfate 已提交
139 140 141 142 143 144 145
            cd dataset
            wget -nc https://paddle-imagenet-models-name.bj.bcebos.com/dygraph/rec/data/drink_dataset_v1.0.tar
            tar -xf drink_dataset_v1.0.tar
        else
            echo "Wrong cpp type in config file in line 3. only support cls, shitu"
        fi
        exit 0
H
debug  
HydrogenSulfate 已提交
146
    else
H
debug  
HydrogenSulfate 已提交
147 148
        echo "use wrong config file"
        exit 1
H
debug  
HydrogenSulfate 已提交
149
    fi
D
dongshuilong 已提交
150 151
fi

S
stephon 已提交
152 153 154 155
model_name=$(func_parser_value "${lines[1]}")
model_url_value=$(func_parser_value "${lines[35]}")
model_url_key=$(func_parser_key "${lines[35]}")

156
if [[ $model_name == *ShiTu* ]]; then
H
debug  
HydrogenSulfate 已提交
157 158 159 160
    cd dataset
    rm -rf Aliproduct
    rm -rf train_reg_all_data.txt
    rm -rf demo_train
H
debug  
HydrogenSulfate 已提交
161
    wget -nc https://paddle-imagenet-models-name.bj.bcebos.com/data/whole_chain/tipc_shitu_demo_data.tar --no-check-certificate
H
debug  
HydrogenSulfate 已提交
162 163 164 165 166 167 168
    tar -xf tipc_shitu_demo_data.tar
    ln -s tipc_shitu_demo_data Aliproduct
    ln -s tipc_shitu_demo_data/demo_train.txt train_reg_all_data.txt
    ln -s tipc_shitu_demo_data/demo_train demo_train
    cd tipc_shitu_demo_data
    ln -s demo_test.txt val_list.txt
    cd ../../
H
debug  
HydrogenSulfate 已提交
169
    eval "wget -nc $model_url_value --no-check-certificate"
H
debug  
HydrogenSulfate 已提交
170 171
    mv general_PPLCNet_x2_5_pretrained_v1.0.pdparams GeneralRecognition_PPLCNet_x2_5_pretrained.pdparams
    exit 0
D
dongshuilong 已提交
172 173
fi

H
debug  
HydrogenSulfate 已提交
174
if [[ $FILENAME == *use_dali* ]]; then
L
lubin10 已提交
175 176 177 178
    python_name=$(func_parser_value "${lines[2]}")
    ${python_name} -m pip install --extra-index-url https://developer.download.nvidia.com/compute/redist/nightly --upgrade nvidia-dali-nightly-cuda102
fi

H
HydrogenSulfate 已提交
179
if [[ ${MODE} = "lite_train_lite_infer" ]] || [[ ${MODE} = "lite_train_whole_infer" ]]; then
180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205
    if [[ ${model_name} =~ "GeneralRecognition" ]]; then
        cd dataset
        rm -rf Aliproduct
        rm -rf train_reg_all_data.txt
        rm -rf demo_train
        wget -nc https://paddle-imagenet-models-name.bj.bcebos.com/data/whole_chain/tipc_shitu_demo_data.tar --no-check-certificate
        tar -xf tipc_shitu_demo_data.tar
        ln -s tipc_shitu_demo_data Aliproduct
        ln -s tipc_shitu_demo_data/demo_train.txt train_reg_all_data.txt
        ln -s tipc_shitu_demo_data/demo_train demo_train
        cd tipc_shitu_demo_data
        ln -s demo_test.txt val_list.txt
        cd ../../
    else
        # pretrain lite train data
        cd dataset
        rm -rf ILSVRC2012
        wget -nc https://paddle-imagenet-models-name.bj.bcebos.com/data/whole_chain/whole_chain_little_train.tar --no-check-certificate
        tar xf whole_chain_little_train.tar
        ln -s whole_chain_little_train ILSVRC2012
        cd ILSVRC2012
        mv train.txt train_list.txt
        mv val.txt val_list.txt
        cp -r train/* val/
        cd ../../
    fi
H
HydrogenSulfate 已提交
206 207 208 209 210 211 212 213
    if [[ ${FILENAME} =~ "pact_infer" ]]; then
        # download pretrained model for PACT training
        pretrpretrained_model_url=$(func_parser_value "${lines[35]}")
        mkdir pretrained_model
        cd pretrained_model
        wget -nc ${pretrpretrained_model_url} --no-check-certificate
        cd ..
    fi
H
HydrogenSulfate 已提交
214
elif [[ ${MODE} = "whole_infer" ]]; then
S
stephon 已提交
215
    # download data
H
HydrogenSulfate 已提交
216 217 218 219 220 221 222 223 224 225 226
    if [[ ${model_name} =~ "GeneralRecognition" ]]; then
        cd dataset
        rm -rf Aliproduct
        rm -rf train_reg_all_data.txt
        rm -rf demo_train
        wget -nc https://paddle-imagenet-models-name.bj.bcebos.com/data/whole_chain/tipc_shitu_demo_data.tar --no-check-certificate
        tar -xf tipc_shitu_demo_data.tar
        ln -s tipc_shitu_demo_data Aliproduct
        ln -s tipc_shitu_demo_data/demo_train.txt train_reg_all_data.txt
        ln -s tipc_shitu_demo_data/demo_train demo_train
        cd tipc_shitu_demo_data
227
        rm -rf val_list.txt
H
HydrogenSulfate 已提交
228 229 230 231 232 233 234 235 236 237
        ln -s demo_test.txt val_list.txt
        cd ../../
    else
        cd dataset
        rm -rf ILSVRC2012
        wget -nc https://paddle-imagenet-models-name.bj.bcebos.com/data/whole_chain/whole_chain_infer.tar
        tar xf whole_chain_infer.tar
        ln -s whole_chain_infer ILSVRC2012
        cd ILSVRC2012
        mv val.txt val_list.txt
238
        rm -rf train_list.txt
H
HydrogenSulfate 已提交
239 240 241
        ln -s val_list.txt train_list.txt
        cd ../../
    fi
S
stephon 已提交
242 243
    # download inference or pretrained model
    eval "wget -nc $model_url_value"
244 245 246 247 248
    if [[ ${model_url_value} =~ ".tar" ]]; then
        tar_name=$(func_get_url_file_name "${model_url_value}")
        echo $tar_name
        rm -rf {tar_name}
        tar xf ${tar_name}
S
stephon 已提交
249
    fi
H
debug  
HydrogenSulfate 已提交
250 251 252
    if [[ $model_name == "SwinTransformer_large_patch4_window7_224" || $model_name == "SwinTransformer_large_patch4_window12_384" ]]; then
        cmd="mv ${model_name}_22kto1k_pretrained.pdparams ${model_name}_pretrained.pdparams"
        eval $cmd
D
dongshuilong 已提交
253 254
    fi

H
HydrogenSulfate 已提交
255
elif [[ ${MODE} = "whole_train_whole_infer" ]]; then
S
stephon 已提交
256 257 258 259 260
    cd dataset
    rm -rf ILSVRC2012
    wget -nc https://paddle-imagenet-models-name.bj.bcebos.com/data/whole_chain/whole_chain_CIFAR100.tar
    tar xf whole_chain_CIFAR100.tar
    ln -s whole_chain_CIFAR100 ILSVRC2012
G
fix  
gaotingquan 已提交
261
    cd ILSVRC2012
S
stephon 已提交
262
    mv train.txt train_list.txt
D
dongshuilong 已提交
263
    mv test.txt val_list.txt
S
stephon 已提交
264
    cd ../../
H
HydrogenSulfate 已提交
265 266 267 268 269 270 271 272
    if [[ ${FILENAME} =~ "pact_infer" ]]; then
        # download pretrained model for PACT training
        pretrpretrained_model_url=$(func_parser_value "${lines[35]}")
        mkdir pretrained_model
        cd pretrained_model
        wget -nc ${pretrpretrained_model_url} --no-check-certificate
        cd ..
    fi
S
stephon 已提交
273 274
fi

H
HydrogenSulfate 已提交
275
if [[ ${MODE} = "serving_infer" ]]; then
S
stephon 已提交
276
    # prepare serving env
277
    python_name=$(func_parser_value "${lines[2]}")
H
fix  
HydrogenSulfate 已提交
278
    if [[ ${model_name} = "PPShiTu" ]]; then
H
debug  
HydrogenSulfate 已提交
279 280 281 282
        cls_inference_model_url=$(func_parser_value "${lines[3]}")
        cls_tar_name=$(func_get_url_file_name "${cls_inference_model_url}")
        det_inference_model_url=$(func_parser_value "${lines[4]}")
        det_tar_name=$(func_get_url_file_name "${det_inference_model_url}")
283
        cd ./deploy
H
HydrogenSulfate 已提交
284 285
        wget -nc https://paddle-imagenet-models-name.bj.bcebos.com/dygraph/rec/data/drink_dataset_v1.0.tar --no-check-certificate
        tar -xf drink_dataset_v1.0.tar
286 287 288 289 290
        mkdir models
        cd models
        wget -nc ${cls_inference_model_url} && tar xf ${cls_tar_name}
        wget -nc ${det_inference_model_url} && tar xf ${det_tar_name}
        cd ..
H
debug  
HydrogenSulfate 已提交
291 292 293 294
    else
        cls_inference_model_url=$(func_parser_value "${lines[3]}")
        cls_tar_name=$(func_get_url_file_name "${cls_inference_model_url}")
        cd ./deploy/paddleserving
H
debug  
HydrogenSulfate 已提交
295 296 297 298 299 300 301 302 303 304 305 306
        wget -nc ${cls_inference_model_url}
        tar xf ${cls_tar_name}

        # move '_int8' suffix in pact models
        if [[ ${cls_tar_name} =~ "pact_infer" ]]; then
            cls_inference_model_dir=${cls_tar_name%%.tar}
            cd ${cls_inference_model_dir}
            mv inference_int8.pdiparams inference.pdiparams
            mv inference_int8.pdmodel inference.pdmodel
            cd ..
        fi

H
debug  
HydrogenSulfate 已提交
307
        cd ../../
308
    fi
S
stephon 已提交
309 310 311
    unset http_proxy
    unset https_proxy
fi
L
lubin10 已提交
312

H
HydrogenSulfate 已提交
313
if [[ ${MODE} = "paddle2onnx_infer" ]]; then
L
lubin10 已提交
314 315
    # prepare paddle2onnx env
    python_name=$(func_parser_value "${lines[2]}")
H
HydrogenSulfate 已提交
316 317 318
    inference_model_url=$(func_parser_value "${lines[10]}")
    tar_name=${inference_model_url##*/}

319
    ${python_name} -m pip install paddle2onnx
L
lubin10 已提交
320
    ${python_name} -m pip install onnxruntime
321 322 323 324 325 326 327 328 329 330 331
    if [[ ${model_name} =~ "GeneralRecognition" ]]; then
        cd dataset
        rm -rf Aliproduct
        rm -rf train_reg_all_data.txt
        rm -rf demo_train
        wget -nc https://paddle-imagenet-models-name.bj.bcebos.com/data/whole_chain/tipc_shitu_demo_data.tar --no-check-certificate
        tar -xf tipc_shitu_demo_data.tar
        ln -s tipc_shitu_demo_data Aliproduct
        ln -s tipc_shitu_demo_data/demo_train.txt train_reg_all_data.txt
        ln -s tipc_shitu_demo_data/demo_train demo_train
        cd tipc_shitu_demo_data
332
        rm -rf val_list.txt
333 334 335 336 337
        ln -s demo_test.txt val_list.txt
        cd ../../
        eval "wget -nc $model_url_value --no-check-certificate"
        mv general_PPLCNet_x2_5_pretrained_v1.0.pdparams GeneralRecognition_PPLCNet_x2_5_pretrained.pdparams
    fi
H
HydrogenSulfate 已提交
338 339 340 341 342 343
    cd deploy
    mkdir models
    cd models
    wget -nc ${inference_model_url}
    tar xf ${tar_name}
    cd ../../
L
lubin10 已提交
344
fi
D
dongshuilong 已提交
345

H
HydrogenSulfate 已提交
346
if [[ ${MODE} = "benchmark_train" ]]; then
D
dongshuilong 已提交
347 348
    pip install -r requirements.txt
    cd dataset
349 350 351 352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369

    if [[ $model_name == *GeneralRecognition* ]]; then
        rm -rf Aliproduct
        rm -rf train_reg_all_data.txt
        rm -rf demo_train
        wget -nc https://paddle-imagenet-models-name.bj.bcebos.com/data/whole_chain/tipc_shitu_demo_data.tar --no-check-certificate
        tar -xf tipc_shitu_demo_data.tar
        ln -s tipc_shitu_demo_data Aliproduct
        ln -s tipc_shitu_demo_data/demo_train.txt train_reg_all_data.txt
        ln -s tipc_shitu_demo_data/demo_train demo_train
        cd tipc_shitu_demo_data
        ln -s demo_test.txt val_list.txt
    else
        rm -rf ILSVRC2012
        wget -nc https://paddle-imagenet-models-name.bj.bcebos.com/data/ImageNet1k/ILSVRC2012_val.tar
        tar xf ILSVRC2012_val.tar
        ln -s ILSVRC2012_val ILSVRC2012
        cd ILSVRC2012
        rm -rf train_list.txt
        ln -s val_list.txt train_list.txt
    fi
D
dongshuilong 已提交
370
    cd ../../
371

D
dongshuilong 已提交
372
fi