#!/bin/sh
# pcloud_submit.sh
#
# Submit a training job with `paddlecloud submit`.
#
# Usage: run from the directory that contains pcloud_train.sh (the file is
# copied by relative path):
#
#     sh pcloud_submit.sh
#
# Steps:
#   1. Copy pcloud_train.sh into the parent of the current directory.
#   2. Call `paddlecloud submit`, passing that parent directory as the final
#      argument and "sh pcloud_train.sh <args>" as the job entry command.
#   3. Remove the copied pcloud_train.sh again, whether or not the submit
#      succeeded.
#
# Exit status: non-zero if the copy or the submit fails.

# Abort on the first failing command and on use of an unset variable, so a
# failed copy never leads to submitting a job without its entry script.
set -eu

# Arguments forwarded, in this order, to pcloud_train.sh via the -entry string.
TRAIN_MANIFEST="cloud/cloud.manifest.train"
DEV_MANIFEST="cloud/cloud.manifest.dev"
CLOUD_MODEL_DIR="./checkpoints"
BATCH_SIZE=256
NUM_GPU=8
NUM_NODE=1
IS_LOCAL="True"

# Job name is "deepspeech-" followed by a YYYYmmddHHMMSS timestamp.
JOB_NAME="deepspeech-$(date +%Y%m%d%H%M%S)"

# Parent of the current working directory. "${PWD%/*}" is empty when the
# script is run from a directory directly below "/", so fall back to "/".
DS2_PATH="${PWD%/*}"
DS2_PATH="${DS2_PATH:-/}"

# Location of the temporary copy of the entry script inside DS2_PATH.
STAGED_ENTRY="${DS2_PATH%/}/pcloud_train.sh"

cp -f -- pcloud_train.sh "${DS2_PATH}"

# Installed only after the copy succeeded, so a failed copy never deletes a
# file this script did not put there. The EXIT trap fires on every exit path;
# the signal trap turns HUP/INT/TERM into a normal exit so the EXIT trap also
# runs under shells that do not invoke it on signals.
trap 'rm -f -- "${STAGED_ENTRY}"' EXIT
trap 'exit 1' HUP INT TERM

# NOTE(review): -cpu is given the GPU count, exactly as in the original
# script; confirm that one CPU per GPU is the intended request.
# NOTE(review): the -ps* flags presumably size the parameter server(s), and
# the final positional argument is presumably the directory handed to the
# job; verify both against the paddlecloud CLI documentation.
paddlecloud submit \
  -image bootstrapper:5000/paddlepaddle/pcloud_ds2:latest \
  -jobname "${JOB_NAME}" \
  -cpu "${NUM_GPU}" \
  -gpu "${NUM_GPU}" \
  -memory 64Gi \
  -parallelism "${NUM_NODE}" \
  -pscpu 1 \
  -pservers 1 \
  -psmemory 64Gi \
  -passes 1 \
  -entry "sh pcloud_train.sh ${TRAIN_MANIFEST} ${DEV_MANIFEST} ${CLOUD_MODEL_DIR} ${NUM_GPU} ${BATCH_SIZE} ${IS_LOCAL}" \
  "${DS2_PATH}"