---
# Training configuration for the DeiT_base_patch16_384 architecture.
# Paths below point at an ILSVRC2012 dataset directory and per-split list files.

mode: 'train'

ARCHITECTURE:
  name: 'DeiT_base_patch16_384'

# Empty string: no pretrained weights path is configured.
pretrained_model: ""
model_save_dir: "./output/"
classes_num: 1000
total_images: 1281167
save_interval: 1
validate: True
valid_interval: 1
epochs: 120
topk: 5
# Matches the 384 crop size used by the TRAIN and VALID transforms below.
image_shape: [3, 384, 384]

use_mix: False
# NOTE(review): -1 presumably disables label smoothing -- confirm with the consumer.
ls_epsilon: -1

LEARNING_RATE:
  function: 'Cosine'
  params:
    lr: 0.01

OPTIMIZER:
  function: 'Momentum'
  params:
    momentum: 0.9
  regularizer:
    function: 'L2'
    factor: 0.000100

# Training split: input files and the ordered list of transforms.
TRAIN:
  batch_size: 64
  num_workers: 4
  file_list: "./dataset/ILSVRC2012/train_list.txt"
  data_dir: "./dataset/ILSVRC2012/"
  shuffle_seed: 0
  transforms:
    - DecodeImage:
        to_rgb: True
        to_np: False
        channel_first: False
    - RandCropImage:
        size: 384
    - RandFlipImage:
        flip_code: 1
    - NormalizeImage:
        # Contains '/', so YAML loads this as a string, not a number.
        # NOTE(review): presumably evaluated as an expression by the consumer -- confirm.
        scale: 1./255.
        mean: [0.485, 0.456, 0.406]
        std: [0.229, 0.224, 0.225]
        order: ''
    # No parameters given; the value loads as null.
    - ToCHWImage:

# Validation split: input files and the ordered list of transforms.
VALID:
  batch_size: 64
  num_workers: 4
  file_list: "./dataset/ILSVRC2012/val_list.txt"
  data_dir: "./dataset/ILSVRC2012/"
  shuffle_seed: 0
  transforms:
    - DecodeImage:
        to_rgb: True
        to_np: False
        channel_first: False
    - ResizeImage:
        size: 426
    - CropImage:
        size: 384
    - NormalizeImage:
        # Contains '/', so YAML loads this as a string, not a number.
        # NOTE(review): presumably evaluated as an expression by the consumer -- confirm.
        scale: 1.0/255.0
        mean: [0.485, 0.456, 0.406]
        std: [0.229, 0.224, 0.225]
        order: ''
    # No parameters given; the value loads as null.
    - ToCHWImage: