---
# Training configuration for the ViT_base_patch16_224 architecture.
# NOTE(review): the nesting below was reconstructed from a flattened
# single-line source; verify it against the consuming tool's schema.

mode: 'train'

ARCHITECTURE:
  name: 'ViT_base_patch16_224'

# Checkpoint input/output locations. An empty pretrained_model string
# presumably means "no pretrained weights" - confirm with the consumer.
pretrained_model: ''
model_save_dir: './output/'

# Dataset size and run schedule.
classes_num: 1000
total_images: 1281167
save_interval: 1
validate: true
valid_interval: 1
epochs: 120
topk: 5
image_shape: [3, 224, 224]

use_mix: false
# NOTE(review): -1 looks like a "disabled" sentinel - confirm.
ls_epsilon: -1

LEARNING_RATE:
  function: 'Cosine'
  params:
    lr: 0.005

OPTIMIZER:
  function: 'Momentum'
  params:
    momentum: 0.9
  regularizer:
    function: 'L2'
    factor: 0.000100

TRAIN:
  batch_size: 48
  num_workers: 4
  file_list: './dataset/ILSVRC2012/train_list.txt'
  data_dir: './dataset/ILSVRC2012/'
  shuffle_seed: 0
  transforms:
    - DecodeImage:
        to_rgb: true
        to_np: false
        channel_first: false
    - RandCropImage:
        size: 224
    - RandFlipImage:
        flip_code: 1
    - NormalizeImage:
        # Kept as a string expression, not a number; presumably
        # evaluated by the consumer - confirm.
        scale: '1./255.'
        mean: [0.5, 0.5, 0.5]
        std: [0.5, 0.5, 0.5]
        order: ''
    # Transform with no parameters (explicit null).
    - ToCHWImage: null

VALID:
  batch_size: 48
  num_workers: 4
  file_list: './dataset/ILSVRC2012/val_list.txt'
  data_dir: './dataset/ILSVRC2012/'
  shuffle_seed: 0
  transforms:
    - DecodeImage:
        to_rgb: true
        to_np: false
        channel_first: false
    - ResizeImage:
        size: 248
    - CropImage:
        size: 224
    - NormalizeImage:
        # Kept as a string expression, not a number; presumably
        # evaluated by the consumer - confirm.
        scale: '1.0/255.0'
        mean: [0.5, 0.5, 0.5]
        std: [0.5, 0.5, 0.5]
        order: ''
    # Transform with no parameters (explicit null).
    - ToCHWImage: null