#!/usr/bin/env bash
#
# pcloud_submit.sh - submit a "deepspeech" training job via `paddlecloud submit`.
#
# What it does:
#   1. Copies pcloud_train.sh from the current directory into the parent
#      directory (DS2_PATH), which is the directory handed to paddlecloud.
#   2. Runs `paddlecloud submit` with the resource settings defined below and
#      an entry command that invokes pcloud_train.sh with the configured
#      manifests, model directory, GPU count, batch size and local flag.
#   3. Removes the copied pcloud_train.sh from DS2_PATH again, on every exit
#      path (success, failure or interruption).
#
# Usage: run from the directory that contains pcloud_train.sh:
#   ./pcloud_submit.sh

set -euo pipefail

# --- Arguments forwarded positionally to pcloud_train.sh ---------------------
TRAIN_MANIFEST="cloud/cloud_manifests/cloud.manifest.train"
DEV_MANIFEST="cloud/cloud_manifests/cloud.manifest.dev"
CLOUD_MODEL_DIR="./checkpoints"
BATCH_SIZE=512
NUM_GPU=8
NUM_NODE=1
IS_LOCAL="True"

# --- Job identity and submission directory -----------------------------------
# Timestamp suffix gives each submission a distinct job name.
JOB_NAME="deepspeech-$(date +%Y%m%d%H%M%S)"

# Parent of the current working directory (strips the last path component).
DS2_PATH="${PWD%/*}"

# ${PWD%/*} is empty when the working directory sits directly under "/";
# refuse to continue rather than copy to / delete from an unintended path.
if [[ -z "${DS2_PATH}" ]]; then
  printf 'error: cannot derive parent directory from PWD=%s\n' "${PWD}" >&2
  exit 1
fi

# Stage the training entry script inside the directory being submitted.
cp -f -- pcloud_train.sh "${DS2_PATH}"

# Remove the staged copy however the script ends. Installed only after the
# copy succeeded, so a failed cp never triggers a delete.
cleanup() {
  rm -f -- "${DS2_PATH}/pcloud_train.sh"
}
trap cleanup EXIT

submit_args=(
  -image bootstrapper:5000/paddlepaddle/pcloud_ds2:latest
  -jobname "${JOB_NAME}"
  # NOTE(review): the CPU count reuses NUM_GPU, as in the original script;
  # presumably one CPU per GPU is intended - confirm.
  -cpu "${NUM_GPU}"
  -gpu "${NUM_GPU}"
  -memory 64Gi
  -parallelism "${NUM_NODE}"
  -pscpu 1
  -pservers 1
  -psmemory 64Gi
  -passes 1
  -entry "sh pcloud_train.sh ${TRAIN_MANIFEST} ${DEV_MANIFEST} ${CLOUD_MODEL_DIR} ${NUM_GPU} ${BATCH_SIZE} ${IS_LOCAL}"
  "${DS2_PATH}"
)

paddlecloud submit "${submit_args[@]}"