提交 c2802b90 编写于 作者: G gaotingquan 提交者: cuicheng01

Increase batch size (bs) and num_workers to speed up training.

上级 b2ba6994
......@@ -43,7 +43,7 @@ Optimizer:
momentum: 0.9
lr:
name: Cosine
- learning_rate: 1.3
+ learning_rate: 7.8
warmup_epoch: 5
regularizer:
name: 'L2'
......@@ -73,11 +73,11 @@ DataLoader:
sampler:
name: DistributedBatchSampler
- batch_size: 512
+ batch_size: 1536
drop_last: False
shuffle: True
loader:
- num_workers: 4
+ num_workers: 20
use_shared_memory: True
Eval:
......@@ -100,7 +100,7 @@ DataLoader:
order: ''
sampler:
name: DistributedBatchSampler
- batch_size: 64
+ batch_size: 256
drop_last: False
shuffle: False
loader:
......
......@@ -43,7 +43,7 @@ Optimizer:
momentum: 0.9
lr:
name: Cosine
- learning_rate: 0.8
+ learning_rate: 3.2
warmup_epoch: 5
regularizer:
name: 'L2'
......@@ -73,11 +73,11 @@ DataLoader:
sampler:
name: DistributedBatchSampler
- batch_size: 512
+ batch_size: 1024
drop_last: False
shuffle: True
loader:
- num_workers: 4
+ num_workers: 16
use_shared_memory: True
Eval:
......@@ -100,7 +100,7 @@ DataLoader:
order: ''
sampler:
name: DistributedBatchSampler
- batch_size: 64
+ batch_size: 256
drop_last: False
shuffle: False
loader:
......
......@@ -44,9 +44,9 @@ Optimizer:
momentum: 0.9
lr:
name: Piecewise
- learning_rate: 0.1
+ learning_rate: 0.8
decay_epochs: [30, 60, 90]
- values: [0.1, 0.01, 0.001, 0.0001]
+ values: [0.8, 0.08, 0.008, 0.0008]
regularizer:
name: 'L2'
coeff: 0.0001
......@@ -75,11 +75,11 @@ DataLoader:
sampler:
name: DistributedBatchSampler
- batch_size: 64
+ batch_size: 256
drop_last: False
shuffle: True
loader:
- num_workers: 4
+ num_workers: 16
use_shared_memory: True
Eval:
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册