prepare.sh 13.2 KB
Newer Older
S
stephon 已提交
1 2 3
#!/bin/bash
FILENAME=$1

G
fix  
gaotingquan 已提交
4
# MODE be one of ['lite_train_lite_infer' 'lite_train_whole_infer' 'whole_train_whole_infer',
H
HydrogenSulfate 已提交
5
#                 'whole_infer', 'cpp_infer', 'serving_infer',  'lite_infer']
S
stephon 已提交
6 7 8 9 10 11 12 13

MODE=$2

dataline=$(cat ${FILENAME})
# parser params
IFS=$'\n'
lines=(${dataline})

H
debug  
HydrogenSulfate 已提交
14
function func_parser_key() {
S
stephon 已提交
15 16 17 18 19 20 21
    strs=$1
    IFS=":"
    array=(${strs})
    tmp=${array[0]}
    echo ${tmp}
}

H
debug  
HydrogenSulfate 已提交
22
function func_parser_value() {
S
stephon 已提交
23 24 25 26 27 28
    strs=$1
    IFS=":"
    array=(${strs})
    if [ ${#array[*]} = 2 ]; then
        echo ${array[1]}
    else
H
debug  
HydrogenSulfate 已提交
29 30
        IFS="|"
        tmp="${array[1]}:${array[2]}"
S
stephon 已提交
31 32 33 34
        echo ${tmp}
    fi
}

H
debug  
HydrogenSulfate 已提交
35
function func_get_url_file_name() {
D
dongshuilong 已提交
36 37 38
    strs=$1
    IFS="/"
    array=(${strs})
H
debug  
HydrogenSulfate 已提交
39
    tmp=${array[${#array[@]} - 1]}
D
dongshuilong 已提交
40 41 42 43 44
    echo ${tmp}
}

model_name=$(func_parser_value "${lines[1]}")

G
gaotingquan 已提交
45 46 47
# install paddleclas whl
python setup.py install

H
HydrogenSulfate 已提交
48
if [[ ${MODE} = "cpp_infer" ]]; then
H
debug  
HydrogenSulfate 已提交
49
    if [ -d "./deploy/cpp/opencv-3.4.7/opencv3/" ] && [ $(md5sum ./deploy/cpp/opencv-3.4.7.tar.gz | awk -F ' ' '{print $1}') = "faa2b5950f8bee3f03118e600c74746a" ]; then
H
debug  
HydrogenSulfate 已提交
50 51 52 53 54 55 56 57 58 59 60 61 62 63 64
        echo "################### build opencv skipped ###################"
    else
        echo "################### build opencv ###################"
        rm -rf ./deploy/cpp/opencv-3.4.7.tar.gz ./deploy/cpp/opencv-3.4.7/
        pushd ./deploy/cpp/
        wget -nc https://paddleocr.bj.bcebos.com/dygraph_v2.0/test/opencv-3.4.7.tar.gz
        tar -xf opencv-3.4.7.tar.gz

        cd opencv-3.4.7/
        install_path=$(pwd)/opencv3
        rm -rf build
        mkdir build
        cd build

        cmake .. \
H
debug  
HydrogenSulfate 已提交
65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80
        -DCMAKE_INSTALL_PREFIX=${install_path} \
        -DCMAKE_BUILD_TYPE=Release \
        -DBUILD_SHARED_LIBS=OFF \
        -DWITH_IPP=OFF \
        -DBUILD_IPP_IW=OFF \
        -DWITH_LAPACK=OFF \
        -DWITH_EIGEN=OFF \
        -DCMAKE_INSTALL_LIBDIR=lib64 \
        -DWITH_ZLIB=ON \
        -DBUILD_ZLIB=ON \
        -DWITH_JPEG=ON \
        -DBUILD_JPEG=ON \
        -DWITH_PNG=ON \
        -DBUILD_PNG=ON \
        -DWITH_TIFF=ON \
        -DBUILD_TIFF=ON
H
debug  
HydrogenSulfate 已提交
81 82 83 84 85 86 87

        make -j
        make install
        cd ../../
        popd
        echo "################### build opencv finished ###################"
    fi
88 89
    if [[ ! -d "./deploy/cpp/paddle_inference/" ]]; then
        pushd ./deploy/cpp/
90
        PADDLEInfer=$3
91
        if [ "" = "$PADDLEInfer" ]; then
92
            wget -nc https://paddle-inference-lib.bj.bcebos.com/2.2.2/cxx_c/Linux/GPU/x86-64_gcc8.2_avx_mkl_cuda10.1_cudnn7.6.5_trt6.0.1.5/paddle_inference.tgz --no-check-certificate
93
            tar xf paddle_inference.tgz
94 95
        else
            wget -nc ${PADDLEInfer} --no-check-certificate
96 97 98
            tar_name=$(func_get_url_file_name "$PADDLEInfer")
            tar xf ${tar_name}
            if [ ! -d "paddle_inference" ]; then
99
                ln -s paddle_inference_install_dir paddle_inference
100
            fi
101
        fi
102 103
        popd
    fi
H
debug  
HydrogenSulfate 已提交
104 105 106 107 108 109 110 111 112
    if [[ $FILENAME == *infer_cpp_linux_gpu_cpu.txt ]]; then
        cpp_type=$(func_parser_value "${lines[2]}")
        cls_inference_model_dir=$(func_parser_value "${lines[3]}")
        det_inference_model_dir=$(func_parser_value "${lines[4]}")
        cls_inference_url=$(func_parser_value "${lines[5]}")
        det_inference_url=$(func_parser_value "${lines[6]}")

        if [[ $cpp_type == "cls" ]]; then
            eval "wget -nc $cls_inference_url"
H
HydrogenSulfate 已提交
113 114 115
            tar_name=$(func_get_url_file_name "$cls_inference_url")
            model_dir=${tar_name%.*}
            eval "tar xf ${tar_name}"
H
debug  
HydrogenSulfate 已提交
116

H
debug  
HydrogenSulfate 已提交
117 118 119 120 121 122 123 124
            # move '_int8' suffix in pact models
            if [[ ${tar_name} =~ "pact_infer" ]]; then
                cd ${cls_inference_model_dir}
                mv inference_int8.pdiparams inference.pdiparams
                mv inference_int8.pdmodel inference.pdmodel
                cd ..
            fi

H
debug  
HydrogenSulfate 已提交
125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140
            cd dataset
            rm -rf ILSVRC2012
            wget -nc https://paddle-imagenet-models-name.bj.bcebos.com/data/whole_chain/whole_chain_infer.tar
            tar xf whole_chain_infer.tar
            ln -s whole_chain_infer ILSVRC2012
            cd ..
        elif [[ $cpp_type == "shitu" ]]; then
            eval "wget -nc $cls_inference_url"
            tar_name=$(func_get_url_file_name "$cls_inference_url")
            model_dir=${tar_name%.*}
            eval "tar xf ${tar_name}"

            eval "wget -nc $det_inference_url"
            tar_name=$(func_get_url_file_name "$det_inference_url")
            model_dir=${tar_name%.*}
            eval "tar xf ${tar_name}"
H
debug  
HydrogenSulfate 已提交
141

H
debug  
HydrogenSulfate 已提交
142 143 144 145 146 147 148
            cd dataset
            wget -nc https://paddle-imagenet-models-name.bj.bcebos.com/dygraph/rec/data/drink_dataset_v1.0.tar
            tar -xf drink_dataset_v1.0.tar
        else
            echo "Wrong cpp type in config file in line 3. only support cls, shitu"
        fi
        exit 0
H
debug  
HydrogenSulfate 已提交
149
    else
H
debug  
HydrogenSulfate 已提交
150 151
        echo "use wrong config file"
        exit 1
H
debug  
HydrogenSulfate 已提交
152
    fi
D
dongshuilong 已提交
153 154
fi

S
stephon 已提交
155 156 157 158
model_name=$(func_parser_value "${lines[1]}")
model_url_value=$(func_parser_value "${lines[35]}")
model_url_key=$(func_parser_key "${lines[35]}")

159
if [[ $model_name == *ShiTu* ]]; then
H
debug  
HydrogenSulfate 已提交
160 161 162 163
    cd dataset
    rm -rf Aliproduct
    rm -rf train_reg_all_data.txt
    rm -rf demo_train
H
debug  
HydrogenSulfate 已提交
164
    wget -nc https://paddle-imagenet-models-name.bj.bcebos.com/data/whole_chain/tipc_shitu_demo_data.tar --no-check-certificate
H
debug  
HydrogenSulfate 已提交
165 166 167 168 169 170 171
    tar -xf tipc_shitu_demo_data.tar
    ln -s tipc_shitu_demo_data Aliproduct
    ln -s tipc_shitu_demo_data/demo_train.txt train_reg_all_data.txt
    ln -s tipc_shitu_demo_data/demo_train demo_train
    cd tipc_shitu_demo_data
    ln -s demo_test.txt val_list.txt
    cd ../../
H
debug  
HydrogenSulfate 已提交
172
    eval "wget -nc $model_url_value --no-check-certificate"
H
debug  
HydrogenSulfate 已提交
173 174
    mv general_PPLCNet_x2_5_pretrained_v1.0.pdparams GeneralRecognition_PPLCNet_x2_5_pretrained.pdparams
    exit 0
D
dongshuilong 已提交
175 176
fi

H
debug  
HydrogenSulfate 已提交
177
if [[ $FILENAME == *use_dali* ]]; then
L
lubin10 已提交
178 179 180 181
    python_name=$(func_parser_value "${lines[2]}")
    ${python_name} -m pip install --extra-index-url https://developer.download.nvidia.com/compute/redist/nightly --upgrade nvidia-dali-nightly-cuda102
fi

H
HydrogenSulfate 已提交
182
if [[ ${MODE} = "lite_train_lite_infer" ]] || [[ ${MODE} = "lite_train_whole_infer" ]]; then
183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208
    if [[ ${model_name} =~ "GeneralRecognition" ]]; then
        cd dataset
        rm -rf Aliproduct
        rm -rf train_reg_all_data.txt
        rm -rf demo_train
        wget -nc https://paddle-imagenet-models-name.bj.bcebos.com/data/whole_chain/tipc_shitu_demo_data.tar --no-check-certificate
        tar -xf tipc_shitu_demo_data.tar
        ln -s tipc_shitu_demo_data Aliproduct
        ln -s tipc_shitu_demo_data/demo_train.txt train_reg_all_data.txt
        ln -s tipc_shitu_demo_data/demo_train demo_train
        cd tipc_shitu_demo_data
        ln -s demo_test.txt val_list.txt
        cd ../../
    else
        # pretrain lite train data
        cd dataset
        rm -rf ILSVRC2012
        wget -nc https://paddle-imagenet-models-name.bj.bcebos.com/data/whole_chain/whole_chain_little_train.tar --no-check-certificate
        tar xf whole_chain_little_train.tar
        ln -s whole_chain_little_train ILSVRC2012
        cd ILSVRC2012
        mv train.txt train_list.txt
        mv val.txt val_list.txt
        cp -r train/* val/
        cd ../../
    fi
H
HydrogenSulfate 已提交
209 210 211 212 213 214 215 216
    if [[ ${FILENAME} =~ "pact_infer" ]]; then
        # download pretrained model for PACT training
        pretrpretrained_model_url=$(func_parser_value "${lines[35]}")
        mkdir pretrained_model
        cd pretrained_model
        wget -nc ${pretrpretrained_model_url} --no-check-certificate
        cd ..
    fi
H
HydrogenSulfate 已提交
217
elif [[ ${MODE} = "whole_infer" ]]; then
S
stephon 已提交
218
    # download data
H
HydrogenSulfate 已提交
219 220 221 222 223 224 225 226 227 228 229
    if [[ ${model_name} =~ "GeneralRecognition" ]]; then
        cd dataset
        rm -rf Aliproduct
        rm -rf train_reg_all_data.txt
        rm -rf demo_train
        wget -nc https://paddle-imagenet-models-name.bj.bcebos.com/data/whole_chain/tipc_shitu_demo_data.tar --no-check-certificate
        tar -xf tipc_shitu_demo_data.tar
        ln -s tipc_shitu_demo_data Aliproduct
        ln -s tipc_shitu_demo_data/demo_train.txt train_reg_all_data.txt
        ln -s tipc_shitu_demo_data/demo_train demo_train
        cd tipc_shitu_demo_data
230
        rm -rf val_list.txt
H
HydrogenSulfate 已提交
231 232 233 234 235 236 237 238 239 240
        ln -s demo_test.txt val_list.txt
        cd ../../
    else
        cd dataset
        rm -rf ILSVRC2012
        wget -nc https://paddle-imagenet-models-name.bj.bcebos.com/data/whole_chain/whole_chain_infer.tar
        tar xf whole_chain_infer.tar
        ln -s whole_chain_infer ILSVRC2012
        cd ILSVRC2012
        mv val.txt val_list.txt
241
        rm -rf train_list.txt
H
HydrogenSulfate 已提交
242 243 244
        ln -s val_list.txt train_list.txt
        cd ../../
    fi
S
stephon 已提交
245 246
    # download inference or pretrained model
    eval "wget -nc $model_url_value"
247 248 249 250 251
    if [[ ${model_url_value} =~ ".tar" ]]; then
        tar_name=$(func_get_url_file_name "${model_url_value}")
        echo $tar_name
        rm -rf {tar_name}
        tar xf ${tar_name}
S
stephon 已提交
252
    fi
H
debug  
HydrogenSulfate 已提交
253 254 255
    if [[ $model_name == "SwinTransformer_large_patch4_window7_224" || $model_name == "SwinTransformer_large_patch4_window12_384" ]]; then
        cmd="mv ${model_name}_22kto1k_pretrained.pdparams ${model_name}_pretrained.pdparams"
        eval $cmd
D
dongshuilong 已提交
256 257
    fi

H
HydrogenSulfate 已提交
258
elif [[ ${MODE} = "whole_train_whole_infer" ]]; then
S
stephon 已提交
259 260 261 262 263
    cd dataset
    rm -rf ILSVRC2012
    wget -nc https://paddle-imagenet-models-name.bj.bcebos.com/data/whole_chain/whole_chain_CIFAR100.tar
    tar xf whole_chain_CIFAR100.tar
    ln -s whole_chain_CIFAR100 ILSVRC2012
G
fix  
gaotingquan 已提交
264
    cd ILSVRC2012
S
stephon 已提交
265
    mv train.txt train_list.txt
D
dongshuilong 已提交
266
    mv test.txt val_list.txt
S
stephon 已提交
267
    cd ../../
H
HydrogenSulfate 已提交
268 269 270 271 272 273 274 275
    if [[ ${FILENAME} =~ "pact_infer" ]]; then
        # download pretrained model for PACT training
        pretrpretrained_model_url=$(func_parser_value "${lines[35]}")
        mkdir pretrained_model
        cd pretrained_model
        wget -nc ${pretrpretrained_model_url} --no-check-certificate
        cd ..
    fi
S
stephon 已提交
276 277
fi

H
HydrogenSulfate 已提交
278
if [[ ${MODE} = "serving_infer" ]]; then
S
stephon 已提交
279
    # prepare serving env
280
    python_name=$(func_parser_value "${lines[2]}")
H
fix  
HydrogenSulfate 已提交
281
    if [[ ${model_name} = "PPShiTu" ]]; then
H
debug  
HydrogenSulfate 已提交
282 283 284 285
        cls_inference_model_url=$(func_parser_value "${lines[3]}")
        cls_tar_name=$(func_get_url_file_name "${cls_inference_model_url}")
        det_inference_model_url=$(func_parser_value "${lines[4]}")
        det_tar_name=$(func_get_url_file_name "${det_inference_model_url}")
286
        cd ./deploy
H
HydrogenSulfate 已提交
287 288
        wget -nc https://paddle-imagenet-models-name.bj.bcebos.com/dygraph/rec/data/drink_dataset_v1.0.tar --no-check-certificate
        tar -xf drink_dataset_v1.0.tar
289 290 291 292 293
        mkdir models
        cd models
        wget -nc ${cls_inference_model_url} && tar xf ${cls_tar_name}
        wget -nc ${det_inference_model_url} && tar xf ${det_tar_name}
        cd ..
H
debug  
HydrogenSulfate 已提交
294 295 296 297
    else
        cls_inference_model_url=$(func_parser_value "${lines[3]}")
        cls_tar_name=$(func_get_url_file_name "${cls_inference_model_url}")
        cd ./deploy/paddleserving
H
debug  
HydrogenSulfate 已提交
298 299 300 301 302 303 304 305 306 307 308 309
        wget -nc ${cls_inference_model_url}
        tar xf ${cls_tar_name}

        # move '_int8' suffix in pact models
        if [[ ${cls_tar_name} =~ "pact_infer" ]]; then
            cls_inference_model_dir=${cls_tar_name%%.tar}
            cd ${cls_inference_model_dir}
            mv inference_int8.pdiparams inference.pdiparams
            mv inference_int8.pdmodel inference.pdmodel
            cd ..
        fi

H
debug  
HydrogenSulfate 已提交
310
        cd ../../
311
    fi
S
stephon 已提交
312 313 314
    unset http_proxy
    unset https_proxy
fi
L
lubin10 已提交
315

H
HydrogenSulfate 已提交
316
if [[ ${MODE} = "paddle2onnx_infer" ]]; then
L
lubin10 已提交
317 318
    # prepare paddle2onnx env
    python_name=$(func_parser_value "${lines[2]}")
H
HydrogenSulfate 已提交
319 320 321
    inference_model_url=$(func_parser_value "${lines[10]}")
    tar_name=${inference_model_url##*/}

322
    ${python_name} -m pip install paddle2onnx
L
lubin10 已提交
323
    ${python_name} -m pip install onnxruntime
324 325 326 327 328 329 330 331 332 333 334
    if [[ ${model_name} =~ "GeneralRecognition" ]]; then
        cd dataset
        rm -rf Aliproduct
        rm -rf train_reg_all_data.txt
        rm -rf demo_train
        wget -nc https://paddle-imagenet-models-name.bj.bcebos.com/data/whole_chain/tipc_shitu_demo_data.tar --no-check-certificate
        tar -xf tipc_shitu_demo_data.tar
        ln -s tipc_shitu_demo_data Aliproduct
        ln -s tipc_shitu_demo_data/demo_train.txt train_reg_all_data.txt
        ln -s tipc_shitu_demo_data/demo_train demo_train
        cd tipc_shitu_demo_data
335
        rm -rf val_list.txt
336 337 338 339 340
        ln -s demo_test.txt val_list.txt
        cd ../../
        eval "wget -nc $model_url_value --no-check-certificate"
        mv general_PPLCNet_x2_5_pretrained_v1.0.pdparams GeneralRecognition_PPLCNet_x2_5_pretrained.pdparams
    fi
H
HydrogenSulfate 已提交
341 342 343 344 345 346
    cd deploy
    mkdir models
    cd models
    wget -nc ${inference_model_url}
    tar xf ${tar_name}
    cd ../../
L
lubin10 已提交
347
fi
D
dongshuilong 已提交
348

H
HydrogenSulfate 已提交
349
if [[ ${MODE} = "benchmark_train" ]]; then
D
dongshuilong 已提交
350 351
    pip install -r requirements.txt
    cd dataset
352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369 370 371 372

    if [[ $model_name == *GeneralRecognition* ]]; then
        rm -rf Aliproduct
        rm -rf train_reg_all_data.txt
        rm -rf demo_train
        wget -nc https://paddle-imagenet-models-name.bj.bcebos.com/data/whole_chain/tipc_shitu_demo_data.tar --no-check-certificate
        tar -xf tipc_shitu_demo_data.tar
        ln -s tipc_shitu_demo_data Aliproduct
        ln -s tipc_shitu_demo_data/demo_train.txt train_reg_all_data.txt
        ln -s tipc_shitu_demo_data/demo_train demo_train
        cd tipc_shitu_demo_data
        ln -s demo_test.txt val_list.txt
    else
        rm -rf ILSVRC2012
        wget -nc https://paddle-imagenet-models-name.bj.bcebos.com/data/ImageNet1k/ILSVRC2012_val.tar
        tar xf ILSVRC2012_val.tar
        ln -s ILSVRC2012_val ILSVRC2012
        cd ILSVRC2012
        rm -rf train_list.txt
        ln -s val_list.txt train_list.txt
    fi
D
dongshuilong 已提交
373
    cd ../../
374

D
dongshuilong 已提交
375
fi