ShuffleNetV2_swish.sh 417 字节
Newer Older
R
ruri 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15
## Training details
# Reference run noted by the author: NVIDIA Tesla K40, 4 cards, 240 epochs, 156h.

# Make GPU devices 0-3 visible to the training process (the 4 cards noted above).
export CUDA_VISIBLE_DEVICES=0,1,2,3

# Runtime flags passed to the training process through the environment.
# NOTE(review): these look like framework memory-management flags (eager
# tensor deletion, fraction of GPU memory to use) -- confirm against the
# framework documentation used by train.py.
export FLAGS_fast_eager_deletion_mode=1 \
  FLAGS_eager_delete_tensor_gb=0.0 \
  FLAGS_fraction_of_gpu_memory_to_use=0.98

# Start training ShuffleNetV2_swish; checkpoints go under output/.
# num_epochs matches the 240 epochs of the reference run above.
python train.py \
  --model=ShuffleNetV2_swish \
  --batch_size=1024 \
  --model_save_dir=output/ \
  --lr_strategy=cosine_decay_warmup \
  --lr=0.5 \
  --num_epochs=240 \
  --l2_decay=4e-5