# rec_mv3_none_bilstm_ctc_simple.yml (2.3 KB) - text extracted from a blame view; line 1 committed by WenmuZhou
# Run-wide settings: device, schedule, checkpoint/output paths, and the
# character-set options used for data and label processing.
# Booleans are written as lowercase true/false and unset paths as explicit
# null; both parse to the same values as the previous True/False/empty forms.
Global:
  use_gpu: false
  epoch_num: 500
  log_smooth_window: 20
  print_batch_step: 10
  save_model_dir: ./output/rec/mv3_none_bilstm_ctc/
  save_epoch_step: 500
  # Evaluation cadence, in iterations.
  # NOTE(review): the previous comment said "every 5000 iterations after the
  # 4000th iteration", which does not match the value 127 - confirm which
  # one is intended.
  eval_batch_step: 127
  # if pretrained_model was saved in static mode, load_static_weights must be set to true
  load_static_weights: true
  cal_metric_during_train: true
  pretrained_model: null
  checkpoints: null
  save_inference_dir: null
  use_visualdl: false
  infer_img: doc/imgs_words/ch/word_1.jpg
  # for data or label process
  max_text_length: 80
  character_dict_path: ppocr/utils/ppocr_keys_v1.txt
  character_type: 'ch'
  use_space_char: false
  infer_mode: false
  use_tps: false


# Optimizer settings: Adam with a fixed learning-rate value and an L2
# regularizer. `lr` must stay nested directly under `learning_rate`.
Optimizer:
  name: Adam
  beta1: 0.9
  beta2: 0.999
  learning_rate:
    lr: 0.001
  regularizer:
    name: 'L2'
    factor: 0.00001

# Model definition: a CRNN recognizer built from Backbone -> Neck -> Head,
# with no Transform stage configured.
Architecture:
  type: rec
  algorithm: CRNN
  Transform: null
  Backbone:
    name: MobileNetV3
    scale: 0.5
    model_name: small
    small_stride: [1, 2, 2, 2]
  Neck:
    name: SequenceEncoder
    # NOTE(review): the file name and Global.save_model_dir both say
    # "bilstm", but the encoder configured here is `fc` - confirm this is
    # the intended encoder for the "simple" variant.
    encoder_type: fc
    hidden_size: 96
  Head:
    name: CTC
    fc_decay: 0.00001

# Training loss, selected by name.
Loss:
  name: CTCLoss

# Post-processing step, selected by name.
# NOTE(review): presumably decodes network output into text - confirm against the consumer.
PostProcess:
  name: CTCLabelDecode

# Evaluation metric; `main_indicator` names the field of the metric result
# treated as the primary score (presumably used for best-model selection - TODO confirm).
Metric:
  name: RecMetric
  main_indicator: acc

# Training data pipeline: dataset sources, per-sample transforms, and
# data-loader settings.
TRAIN:
  dataset:
    name: SimpleDataSet
    data_dir: ./rec
    file_list:
      - ./rec/train.txt  # dataset1
    # One ratio per entry in file_list. The list previously held two values
    # ([0.4, 0.6]) although only one label file is configured, so it is
    # reduced to a single 1.0 to match.
    ratio_list: [1.0]
    transforms:
      - DecodeImage:  # load image
          img_mode: BGR
          channel_first: false
      - CTCLabelEncode: null  # Class handling label
      - RecAug: null
      - RecResizeImg:
          image_shape: [3, 32, 320]
      - keepKeys:
          keep_keys: ['image', 'label', 'length']  # dataloader will return list in this order
  loader:
    batch_size: 256
    shuffle: true
    drop_last: true
    num_workers: 8

# Evaluation data pipeline: same decode/encode/resize steps as training but
# without augmentation, and with shuffling and drop_last disabled.
EVAL:
  dataset:
    name: SimpleDataSet
    data_dir: ./rec
    file_list:
      - ./rec/val.txt
    transforms:
      - DecodeImage:  # load image
          img_mode: BGR
          channel_first: false
      - CTCLabelEncode: null  # Class handling label
      - RecResizeImg:
          image_shape: [3, 32, 320]
      - keepKeys:
          keep_keys: ['image', 'label', 'length']  # dataloader will return list in this order
  loader:
    shuffle: false
    drop_last: false
    batch_size: 256
    num_workers: 8