# run_openblas_train.sh
set -e

#######################################
# Run one timed `paddle train` job on CPU with OpenBLAS and append the
# resulting throughput to the job's log file.
# Globals:
#   OPENBLAS_NUM_THREADS (exported, set to 1)
# Arguments:
#   $1 - topology name; the config file passed to paddle is "<topology>.py"
#   $2 - layer_num value forwarded through --config_args
#   $3 - batch size, forwarded through --config_args and used for the FPS math
# Outputs:
#   Streams paddle's combined stdout/stderr to stdout and to
#   logs/train-<topology>-<layer_num>-<nproc>openblas-<bs>.log, then prints
#   and appends a "FPS: <value> images/sec" line.
# Returns:
#   0 on success, paddle's exit status if paddle fails, 1 if the last log
#   line does not yield a positive average time.
#######################################
train() {
  export OPENBLAS_NUM_THREADS=1

  local topology=$1
  local layer_num=$2
  local bs=$3

  local thread
  thread=$(nproc)
  # each trainer_count use only 1 core to avoid conflict
  local log="logs/train-${topology}-${layer_num}-${thread}openblas-${bs}.log"
  local args="batch_size=${bs},layer_num=${layer_num}"
  local config="${topology}.py"

  local paddle_status
  paddle train --job=time \
    --config="${config}" \
    --use_mkldnn=False \
    --use_gpu=False \
    --trainer_count="${thread}" \
    --log_period=3 \
    --test_period=30 \
    --config_args="${args}" \
    2>&1 | tee "${log}"
  # tee's status is what the pipeline reports, so paddle's own status has to
  # be read from PIPESTATUS immediately after the pipeline.
  paddle_status=${PIPESTATUS[0]}
  if (( paddle_status != 0 )); then
    echo "paddle train failed with status ${paddle_status}; see ${log}" >&2
    return "${paddle_status}"
  fi

  # The 8th whitespace-separated field of the last log line is expected to
  # look like "avg=<number>" (presumably milliseconds per batch, given the
  # *1000 below -- confirm against paddle's --job=time output).
  local avg_time
  avg_time=$(tail -n 1 "${log}" | awk '{print $8}' | sed 's/avg=//')

  # Values are passed with -v instead of being spliced into the awk program,
  # so an empty or malformed avg_time is rejected rather than producing an
  # awk syntax error or a division by zero.
  local fps
  if ! fps=$(awk -v bs="${bs}" -v avg="${avg_time}" \
    'BEGIN { if (avg + 0 <= 0) exit 1; printf "%.2f", bs / avg * 1000 }'); then
    echo "no positive avg time found on the last line of ${log}" >&2
    return 1
  fi

  echo "FPS: $fps images/sec" 2>&1 | tee -a "${log}"
}

# Prepare the working directory: a placeholder train.list (a single space
# plus newline) and the logs directory are created only when missing.
[ -f "train.list" ] || echo " " > train.list
[ -d "logs" ] || mkdir logs

# training benchmark: each "<topology> <layer_num>" entry is run at every
# batch size, in the listed order within each batch size.
models=("vgg 19" "resnet 50" "googlenet v1" "alexnet 2")
for batchsize in 64 128 256; do
  for spec in "${models[@]}"; do
    # Split the entry at its single space: topology before, layer_num after.
    train "${spec% *}" "${spec#* }" "${batchsize}"
  done
done