# NOTE(review): the parent mapping of the keys below is outside this view —
# confirm nesting/indentation when merging.

# Original note on mixer kinds: Local atten, Global atten, Conv.
# This list holds 8 'Local' entries followed by 10 'Global' entries.
mixer:
  [
    'Local', 'Local', 'Local', 'Local', 'Local', 'Local', 'Local', 'Local',
    'Global', 'Global', 'Global', 'Global', 'Global',
    'Global', 'Global', 'Global', 'Global', 'Global'
  ]
# Range of the local mixer: in each pair, 7 is the range along the height
# and 11 is the range along the width.
local_mixer: [[7, 11], [7, 11], [7, 11]]
prenorm: false
# NOTE(review): Neck and Head are presumably children of an architecture
# mapping whose header is outside this view — confirm nesting.
Neck:
  name: SequenceEncoder
  encoder_type: reshape
Head:
  name: CTCHead

Loss:
  name: CTCLoss

PostProcess:
  name: CTCLabelDecode

Metric:
  name: RecMetric
  main_indicator: acc
# Training data: LMDB dataset, the ordered per-sample transforms, and the
# loader settings.
Train:
  dataset:
    name: LMDBDataSet
    data_dir: ./train_data/scene_ch/ch_scene
    transforms:
      - DecodeImage:  # load image
          img_mode: BGR
          channel_first: false
      - CTCLabelEncode: null  # Class handling label
      - RecResizeImg:
          image_shape: [3, 64, 256]
          padding: false
      - KeepKeys:
          # dataloader will return list in this order
          keep_keys: ['image', 'label', 'length']
  loader:
    shuffle: true
    batch_size_per_card: 128
    drop_last: true
    num_workers: 2
# Evaluation data: LMDB dataset and the ordered per-sample transforms.
Eval:
  dataset:
    name: LMDBDataSet
    data_dir: ./train_data/scene_ch/scene_test
    transforms:
      - DecodeImage:  # load image
          img_mode: BGR
          channel_first: false
      - CTCLabelEncode: null  # Class handling label
      - RecResizeImg:
          image_shape: [3, 64, 256]
          padding: false
      - KeepKeys:
          # dataloader will return list in this order
          keep_keys: ['image', 'label', 'length']
# NOTE(review): the parent mapping of the keys below is outside this view —
# confirm nesting/indentation when merging.

# Original note on mixer kinds: Local atten, Global atten, Conv.
# This list holds 8 'Local' entries followed by 10 'Global' entries.
mixer:
  [
    'Local', 'Local', 'Local', 'Local', 'Local', 'Local', 'Local', 'Local',
    'Global', 'Global', 'Global', 'Global', 'Global',
    'Global', 'Global', 'Global', 'Global', 'Global'
  ]
# Range of the local mixer: in each pair, 7 is the range along the height
# and 11 is the range along the width.
local_mixer: [[7, 11], [7, 11], [7, 11]]
last_stage: true
prenorm: false
# NOTE(review): Neck and Head are presumably children of an architecture
# mapping whose header is outside this view — confirm nesting.
Neck:
  name: SequenceEncoder
  encoder_type: reshape
Head:
  name: CTCHead

Loss:
  name: CTCLoss

PostProcess:
  # SVTRLabelDecode is used for eval, please change to CTCLabelDecode when training
  name: SVTRLabelDecode

Metric:
  name: RecMetric
  main_indicator: acc
# Training data: LMDB dataset and the ordered per-sample transforms.
Train:
  dataset:
    name: LMDBDataSet
    data_dir: ./train_data/data_lmdb_release/training
    transforms:
      - DecodeImage:  # load image
          img_mode: BGR
          channel_first: false
      - CTCLabelEncode: null  # Class handling label
      # SVTRRecResizeImg is used for eval, please change to RecResizeImg when training
      # NOTE(review): this op is described as eval-only yet sits under the
      # Train transforms — confirm this is intended.
      - SVTRRecResizeImg:
          character_dict_path: null
          image_shape: [3, 64, 256]
          padding: false
      - KeepKeys:
          # dataloader will return list in this order
          keep_keys: ['image', 'label', 'length']
# NOTE(review): the parent mapping of the keys below is outside this view —
# confirm nesting/indentation when merging.

# Original note on mixer kinds: Local atten, Global atten, Conv.
# This list holds 10 'Local' entries followed by 11 'Global' entries.
mixer:
  [
    'Local', 'Local', 'Local', 'Local', 'Local',
    'Local', 'Local', 'Local', 'Local', 'Local',
    'Global', 'Global', 'Global', 'Global', 'Global', 'Global',
    'Global', 'Global', 'Global', 'Global', 'Global'
  ]
# Range of the local mixer: in each pair, 7 is the range along the height
# and 11 is the range along the width.
local_mixer: [[7, 11], [7, 11], [7, 11]]
prenorm: false
# NOTE(review): Neck and Head are presumably children of an architecture
# mapping whose header is outside this view — confirm nesting.
Neck:
  name: SequenceEncoder
  encoder_type: reshape
Head:
  name: CTCHead

Loss:
  name: CTCLoss

PostProcess:
  name: CTCLabelDecode

Metric:
  name: RecMetric
  main_indicator: acc
# Training data: LMDB dataset, the ordered per-sample transforms, and the
# loader settings.
Train:
  dataset:
    name: LMDBDataSet
    data_dir: ./train_data/scene_ch/ch_scene
    transforms:
      - DecodeImage:  # load image
          img_mode: BGR
          channel_first: false
      - CTCLabelEncode: null  # Class handling label
      - RecResizeImg:
          image_shape: [3, 64, 256]
          padding: false
      - KeepKeys:
          # dataloader will return list in this order
          keep_keys: ['image', 'label', 'length']
  loader:
    shuffle: true
    batch_size_per_card: 128
    drop_last: true
    num_workers: 2
# Evaluation data: LMDB dataset and the ordered per-sample transforms.
Eval:
  dataset:
    name: LMDBDataSet
    data_dir: ./train_data/scene_ch/scene_test
    transforms:
      - DecodeImage:  # load image
          img_mode: BGR
          channel_first: false
      - CTCLabelEncode: null  # Class handling label
      - RecResizeImg:
          image_shape: [3, 64, 256]
          padding: false
      - KeepKeys:
          # dataloader will return list in this order
          keep_keys: ['image', 'label', 'length']
# NOTE(review): the parent mapping of the keys below is outside this view —
# confirm nesting/indentation when merging.

# Original note on mixer kinds: Local atten, Global atten, Conv.
# This list holds 10 'Local' entries followed by 11 'Global' entries.
mixer:
  [
    'Local', 'Local', 'Local', 'Local', 'Local',
    'Local', 'Local', 'Local', 'Local', 'Local',
    'Global', 'Global', 'Global', 'Global', 'Global', 'Global',
    'Global', 'Global', 'Global', 'Global', 'Global'
  ]
# Range of the local mixer: in each pair, 7 is the range along the height
# and 11 is the range along the width.
local_mixer: [[7, 11], [7, 11], [7, 11]]
prenorm: false
# NOTE(review): Neck and Head are presumably children of an architecture
# mapping whose header is outside this view — confirm nesting.
Neck:
  name: SequenceEncoder
  encoder_type: reshape
Head:
  name: CTCHead

Loss:
  name: CTCLoss

PostProcess:
  # SVTRLabelDecode is used for eval, please change to CTCLabelDecode when training
  name: SVTRLabelDecode

Metric:
  name: RecMetric
  main_indicator: acc
# Training data: LMDB dataset and the ordered per-sample transforms
# (this variant includes RecAug with no arguments).
Train:
  dataset:
    name: LMDBDataSet
    data_dir: ./train_data/data_lmdb_release/training
    transforms:
      - DecodeImage:  # load image
          img_mode: BGR
          channel_first: false
      - RecAug: null
      - CTCLabelEncode: null  # Class handling label
      # SVTRRecResizeImg is used for eval, please change to RecResizeImg when training
      # NOTE(review): this op is described as eval-only yet sits under the
      # Train transforms — confirm this is intended.
      - SVTRRecResizeImg:
          character_dict_path: null
          image_shape: [3, 64, 256]
          padding: false
      - KeepKeys:
          # dataloader will return list in this order
          keep_keys: ['image', 'label', 'length']
# NOTE(review): the parent mapping of the keys below is outside this view —
# confirm nesting/indentation when merging.

# Original note on mixer kinds: Local atten, Global atten, Conv.
# This list holds 8 'Local' entries followed by 7 'Global' entries.
mixer:
  [
    'Local', 'Local', 'Local', 'Local', 'Local', 'Local', 'Local', 'Local',
    'Global', 'Global', 'Global', 'Global', 'Global', 'Global', 'Global'
  ]
# Range of the local mixer: in each pair, 7 is the range along the height
# and 11 is the range along the width.
local_mixer: [[7, 11], [7, 11], [7, 11]]
last_stage: true
prenorm: false
# NOTE(review): Neck and Head are presumably children of an architecture
# mapping whose header is outside this view — confirm nesting.
Neck:
  name: SequenceEncoder
  encoder_type: reshape
Head:
  name: CTCHead

Loss:
  name: CTCLoss

PostProcess:
  name: CTCLabelDecode

Metric:
  name: RecMetric
  main_indicator: acc
# Training data: LMDB dataset, the ordered per-sample transforms, and the
# loader settings.
Train:
  dataset:
    name: LMDBDataSet
    data_dir: ./train_data/scene_ch/ch_scene
    transforms:
      - DecodeImage:  # load image
          img_mode: BGR
          channel_first: false
      - CTCLabelEncode: null  # Class handling label
      - RecResizeImg:
          image_shape: [3, 64, 256]
          padding: false
      - KeepKeys:
          # dataloader will return list in this order
          keep_keys: ['image', 'label', 'length']
  loader:
    shuffle: true
    batch_size_per_card: 128
    drop_last: true
    num_workers: 2
# Evaluation data: LMDB dataset and the ordered per-sample transforms.
Eval:
  dataset:
    name: LMDBDataSet
    data_dir: ./train_data/scene_ch/scene_test
    transforms:
      - DecodeImage:  # load image
          img_mode: BGR
          channel_first: false
      - CTCLabelEncode: null  # Class handling label
      - RecResizeImg:
          image_shape: [3, 64, 256]
          padding: false
      - KeepKeys:
          # dataloader will return list in this order
          keep_keys: ['image', 'label', 'length']
# NOTE(review): the parent mapping of the keys below is outside this view —
# confirm nesting/indentation when merging.

# Original note on mixer kinds: Local atten, Global atten, Conv.
# This list holds 8 'Local' entries followed by 7 'Global' entries.
mixer:
  [
    'Local', 'Local', 'Local', 'Local', 'Local', 'Local', 'Local', 'Local',
    'Global', 'Global', 'Global', 'Global', 'Global', 'Global', 'Global'
  ]
# Range of the local mixer: in each pair, 7 is the range along the height
# and 11 is the range along the width.
local_mixer: [[7, 11], [7, 11], [7, 11]]
last_stage: true
prenorm: false
# NOTE(review): Neck and Head are presumably children of an architecture
# mapping whose header is outside this view — confirm nesting.
Neck:
  name: SequenceEncoder
  encoder_type: reshape
Head:
  name: CTCHead

Loss:
  name: CTCLoss

PostProcess:
  # SVTRLabelDecode is used for eval, please change to CTCLabelDecode when training
  name: SVTRLabelDecode

Metric:
  name: RecMetric
  main_indicator: acc
# Training data: LMDB dataset and the ordered per-sample transforms.
# NOTE(review): this section ends at the edge of the visible text; further
# keys (e.g. loader settings) may follow — confirm before merging.
Train:
  dataset:
    name: LMDBDataSet
    data_dir: ./train_data/data_lmdb_release/training
    transforms:
      - DecodeImage:  # load image
          img_mode: BGR
          channel_first: false
      - CTCLabelEncode: null  # Class handling label
      # SVTRRecResizeImg is used for eval, please change to RecResizeImg when training
      # NOTE(review): this op is described as eval-only yet sits under the
      # Train transforms — confirm this is intended.
      - SVTRRecResizeImg:
          character_dict_path: null
          image_shape: [3, 64, 256]
          padding: false
      - KeepKeys:
          # dataloader will return list in this order
          keep_keys: ['image', 'label', 'length']