提交 37cd4ed3 编写于 作者: A andyjpaddle

Delete dict90, update SAR postprocess (add rm_symbol option), update sar.yml

上级 ea019601
...@@ -15,7 +15,7 @@ Global: ...@@ -15,7 +15,7 @@ Global:
infer_img: infer_img:
# for data or label process # for data or label process
character_dict_path: ppocr/utils/dict90.txt character_dict_path: ppocr/utils/dict90.txt
character_type: ch character_type: EN_symbol
max_text_length: 30 max_text_length: 30
infer_mode: False infer_mode: False
use_space_char: False use_space_char: False
...@@ -47,6 +47,7 @@ Loss: ...@@ -47,6 +47,7 @@ Loss:
PostProcess: PostProcess:
name: SARLabelDecode name: SARLabelDecode
rm_symbol: True
Metric: Metric:
name: RecMetric name: RecMetric
...@@ -56,8 +57,8 @@ Train: ...@@ -56,8 +57,8 @@ Train:
dataset: dataset:
name: SimpleDataSet name: SimpleDataSet
delimiter: ' ' delimiter: ' '
label_file_list: ['/paddle/data/concat_data/train_list.txt'] label_file_list: ['./train_data/train_list.txt']
data_dir: /paddle/data/concat_data/ data_dir: ./train_data/
ratio_list: 1.0 ratio_list: 1.0
transforms: transforms:
- DecodeImage: # load image - DecodeImage: # load image
...@@ -79,7 +80,7 @@ Train: ...@@ -79,7 +80,7 @@ Train:
Eval: Eval:
dataset: dataset:
name: LMDBDataSet name: LMDBDataSet
data_dir: /paddle/data/ocr_data/evaluation/ data_dir: ./eval_data/evaluation/
transforms: transforms:
- DecodeImage: # load image - DecodeImage: # load image
img_mode: BGR img_mode: BGR
......
...@@ -526,6 +526,7 @@ class SARLabelDecode(BaseRecLabelDecode): ...@@ -526,6 +526,7 @@ class SARLabelDecode(BaseRecLabelDecode):
character_dict_path=None, character_dict_path=None,
character_type='ch', character_type='ch',
use_space_char=False, use_space_char=False,
rm_symbol=True,
**kwargs): **kwargs):
super(SARLabelDecode, self).__init__(character_dict_path, super(SARLabelDecode, self).__init__(character_dict_path,
character_type, use_space_char) character_type, use_space_char)
...@@ -572,6 +573,7 @@ class SARLabelDecode(BaseRecLabelDecode): ...@@ -572,6 +573,7 @@ class SARLabelDecode(BaseRecLabelDecode):
else: else:
conf_list.append(1) conf_list.append(1)
text = ''.join(char_list) text = ''.join(char_list)
if self.rm_symbol:
comp = re.compile('[^A-Z^a-z^0-9^\u4e00-\u9fa5]') comp = re.compile('[^A-Z^a-z^0-9^\u4e00-\u9fa5]')
text = text.lower() text = text.lower()
text = comp.sub('', text) text = comp.sub('', text)
......
0
1
2
3
4
5
6
7
8
9
a
b
c
d
e
f
g
h
i
j
k
l
m
n
o
p
q
r
s
t
u
v
w
x
y
z
A
B
C
D
E
F
G
H
I
J
K
L
M
N
O
P
Q
R
S
T
U
V
W
X
Y
Z
!
"
#
$
%
&
'
(
)
*
+
,
-
.
/
:
;
<
=
>
?
@
[
\
]
_
`
~
\ No newline at end of file
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册