update MobileViTv3-v2 configs

001cdb09 · Yang Nie · Tingquan Gao · 400de784 · 001cdb09 · 001cdb09
3 changed files
--- a/ppcls/configs/ImageNet/MobileViTv3/MobileViTv3_x0_5.yaml
+++ b/ppcls/configs/ImageNet/MobileViTv3/MobileViTv3_x0_5.yaml
@@ -48,14 +48,13 @@ Optimizer:
  beta2: 0.999
  epsilon: 1e-8
  weight_decay: 0.05
-  no_weight_decay_name: .bias norm
  one_dim_param_no_weight_decay: True
  lr:
    # for 8 cards
    name: Cosine
    learning_rate: 0.002
    eta_min: 0.0002
-    warmup_epoch: 20  # 20000 iterations
+    warmup_epoch: 16  # 20000 iterations
    warmup_start_lr: 1e-6
    # by_epoch: True
  clip_norm: 10
@@ -107,7 +106,7 @@ DataLoader:
      name: DistributedBatchSampler
      batch_size: 128
      drop_last: False
-      shuffle: False
+      shuffle: True
    loader:
      num_workers: 4
      use_shared_memory: True

--- a/ppcls/configs/ImageNet/MobileViTv3/MobileViTv3_x0_75.yaml
+++ b/ppcls/configs/ImageNet/MobileViTv3/MobileViTv3_x0_75.yaml
@@ -48,14 +48,13 @@ Optimizer:
  beta2: 0.999
  epsilon: 1e-8
  weight_decay: 0.05
-  no_weight_decay_name: .bias norm
  one_dim_param_no_weight_decay: True
  lr:
    # for 8 cards
    name: Cosine
    learning_rate: 0.002
    eta_min: 0.0002
-    warmup_epoch: 20  # 20000 iterations
+    warmup_epoch: 16  # 20000 iterations
    warmup_start_lr: 1e-6
    # by_epoch: True
  clip_norm: 10
@@ -107,7 +106,7 @@ DataLoader:
      name: DistributedBatchSampler
      batch_size: 128
      drop_last: False
-      shuffle: False
+      shuffle: True
    loader:
      num_workers: 4
      use_shared_memory: True

--- a/ppcls/configs/ImageNet/MobileViTv3/MobileViTv3_x1_0.yaml
+++ b/ppcls/configs/ImageNet/MobileViTv3/MobileViTv3_x1_0.yaml
@@ -48,14 +48,13 @@ Optimizer:
  beta2: 0.999
  epsilon: 1e-8
  weight_decay: 0.05
-  no_weight_decay_name: .bias norm
  one_dim_param_no_weight_decay: True
  lr:
    # for 8 cards
    name: Cosine
    learning_rate: 0.002
    eta_min: 0.0002
-    warmup_epoch: 20  # 20000 iterations
+    warmup_epoch: 16  # 20000 iterations
    warmup_start_lr: 1e-6
    # by_epoch: True
  clip_norm: 10
@@ -107,7 +106,7 @@ DataLoader:
      name: DistributedBatchSampler
      batch_size: 128
      drop_last: False
-      shuffle: False
+      shuffle: True
    loader:
      num_workers: 4
      use_shared_memory: True