run_openblas_infer.sh 1.8 KB
Newer Older
1 2
set -e

T
tensor-tang 已提交
3 4 5 6
function clock_to_seconds() {
  hours=`echo $1 | awk -F ':' '{print $1}'`
  mins=`echo $1 | awk -F ':' '{print $2}'`
  secs=`echo $1 | awk -F ':' '{print $3}'`
T
tensor-tang 已提交
7
  echo `awk 'BEGIN{printf "%.2f",('$secs' + '$mins' * 60 + '$hours' * 3600)}'`
T
tensor-tang 已提交
8 9
}

10 11 12 13 14
function infer() {
  unset OMP_NUM_THREADS MKL_NUM_THREADS OMP_DYNAMIC KMP_AFFINITY
  topology=$1
  layer_num=$2
  bs=$3
15 16 17
  thread=`nproc`
  if [ $thread -gt $bs ]; then
    thread=$bs
18
  fi
19
  log="logs/infer-${topology}-${layer_num}-${thread}openblas-${bs}.log"
20 21 22

  models_in="models/${topology}-${layer_num}/pass-00000/"
  if [ ! -d $models_in ]; then
23 24
    echo "./run_mkl_infer.sh to save the model first"
    exit 0
25
  fi
26
  log_period=$((32 / bs))
27 28
  paddle train --job=test \
    --config="${topology}.py" \
29
    --use_mkldnn=False \
30 31
    --use_gpu=False \
    --trainer_count=$thread \
T
tensor-tang 已提交
32
    --log_period=$log_period \
33
    --config_args="batch_size=${bs},layer_num=${layer_num},is_infer=True,num_samples=256" \
34
    --init_model_path=$models_in \
T
tensor-tang 已提交
35 36
    2>&1 | tee ${log}

37
  # calculate the last 5 logs period time of 160(=32*5) samples,
T
tensor-tang 已提交
38 39 40 41 42
  # the time before are burning time.
  start=`tail ${log} -n 7 | head -n 1 | awk -F ' ' '{print $2}' | xargs`
  end=`tail ${log} -n 2 | head -n 1 | awk -F ' ' '{print $2}' | xargs`
  start_sec=`clock_to_seconds $start`
  end_sec=`clock_to_seconds $end`
43 44
  fps=`awk 'BEGIN{printf "%.2f",(160 / ('$end_sec' - '$start_sec'))}'`
  echo "Last 160 samples start: ${start}(${start_sec} sec), end: ${end}(${end_sec} sec;" >> ${log}
T
tensor-tang 已提交
45
  echo "FPS: $fps images/sec" 2>&1 | tee -a ${log}
46 47 48 49 50 51 52 53 54 55 56 57 58
}

if [ ! -f "train.list" ]; then
  echo " " > train.list
fi
if [ ! -f "test.list" ]; then
  echo " " > test.list
fi
if [ ! -d "logs" ]; then
  mkdir logs
fi

# inference benchmark
59 60
for batchsize in 1 2 4 8 16; do
  infer vgg 19 $batchsize
T
tensor-tang 已提交
61 62 63
  infer resnet 50 $batchsize 
  infer googlenet v1 $batchsize
  infer alexnet 2 $batchsize
64
done