From d1b31bf85cd6e23c8a09758ea6ca03938209ed69 Mon Sep 17 00:00:00 2001
From: WenmuZhou <572459439@qq.com>
Date: Mon, 4 Jul 2022 10:22:25 +0000
Subject: [PATCH] add ref

---
 configs/table/table_master.yml                |  64 +++++-----
 doc/doc_ch/algorithm_det_fcenet.md            |  22 ++--
 doc/doc_ch/algorithm_overview.md              |  16 ++-
 doc/doc_ch/algorithm_table_master.md          | 114 ++++++++++++++++++
 doc/doc_en/algorithm_overview_en.md           |  13 ++
 doc/doc_en/algorithm_table_master_en.md       | 112 +++++++++++++++++
 ppocr/data/imaug/label_ops.py                 |   9 ++
 ppocr/losses/table_master_loss.py             |   5 +
 .../modeling/backbones/table_master_resnet.py |   4 +
 ppocr/modeling/heads/table_master_head.py     |   5 +
 ppocr/postprocess/__init__.py                 |   2 +-
 ppstructure/docs/models_list.md               |   2 +-
 12 files changed, 319 insertions(+), 49 deletions(-)
 create mode 100644 doc/doc_ch/algorithm_table_master.md
 create mode 100644 doc/doc_en/algorithm_table_master_en.md

diff --git a/configs/table/table_master.yml b/configs/table/table_master.yml
index 9dfc0e27..cfd98346 100755
--- a/configs/table/table_master.yml
+++ b/configs/table/table_master.yml
@@ -2,21 +2,19 @@ Global:
   use_gpu: true
   epoch_num: 17
   log_smooth_window: 20
-  print_batch_step: 5
+  print_batch_step: 100
   save_model_dir: ./output/table_master/
   save_epoch_step: 17
-  # evaluation is run every 400 iterations after the 0th iteration
-  eval_batch_step: [0, 400]
-  cal_metric_during_train: True
-  pretrained_model:
-  checkpoints:
-  save_inference_dir:
-  use_visualdl: False
+  eval_batch_step: [0,  6259]
+  cal_metric_during_train: true
+  pretrained_model: null
+  checkpoints: 
+  save_inference_dir: output/table_master/infer
+  use_visualdl: false
   infer_img: ppstructure/docs/table/table.jpg
-  save_res_path: output/table_master
-  # for data or label process
+  save_res_path: ./output/table_master
   character_dict_path: ppocr/utils/dict/table_master_structure_dict.txt
-  infer_mode: False
+  infer_mode: false
   max_text_length: 500
   process_total_num: 0
   process_cut_num: 0
@@ -33,8 +31,8 @@ Optimizer:
     gamma: 0.1
     warmup_epoch: 0.02
   regularizer:
-    name: 'L2'
-    factor: 0.00000
+    name: L2
+    factor: 0.0
 
 Architecture:
   model_type: table
@@ -67,15 +65,15 @@ PostProcess:
 Metric:
   name: TableMetric
   main_indicator: acc
-  compute_bbox_metric: true # cost many time, set False for training
+  compute_bbox_metric: False
 
 Train:
   dataset:
     name: PubTabDataSet
-    data_dir: /home/zhoujun20/table/PubTabNe/pubtabnet/train/
-    label_file_list: [/home/zhoujun20/table/PubTabNe/pubtabnet/PubTabNet_2.0.0_train.jsonl]
+    data_dir: train_data/table/pubtabnet/train/
+    label_file_list: [train_data/table/pubtabnet/PubTabNet_2.0.0_train.jsonl]
     transforms:
-      - DecodeImage: # load image
+      - DecodeImage:
           img_mode: BGR
           channel_first: False
       - TableMasterLabelEncode:
@@ -88,20 +86,20 @@ Train:
       - PaddingTableImage:
           size: [480, 480]
       - TableBoxEncode:
-          use_xywh: true
+          use_xywh: True
       - NormalizeImage:
           scale: 1./255.
           mean: [0.5, 0.5, 0.5]
           std: [0.5, 0.5, 0.5]
-          order: 'hwc'
-      - ToCHWImage:
+          order: hwc
+      - ToCHWImage: null
       - KeepKeys:
-          keep_keys: ['image', 'structure', 'bboxes', 'bbox_masks','shape']
+          keep_keys: [image, structure, bboxes, bbox_masks, shape]
   loader:
     shuffle: True
-    batch_size_per_card: 8
+    batch_size_per_card: 10
     drop_last: True
-    num_workers: 1
+    num_workers: 8
 
 Eval:
   dataset:
@@ -109,7 +107,7 @@ Eval:
     data_dir: /home/zhoujun20/table/PubTabNe/pubtabnet/val/
     label_file_list: [/home/zhoujun20/table/PubTabNe/pubtabnet/val_500.jsonl]
     transforms:
-      - DecodeImage: # load image
+      - DecodeImage:
           img_mode: BGR
           channel_first: False
       - TableMasterLabelEncode:
@@ -120,19 +118,19 @@ Eval:
           max_len: 480
           resize_bboxes: True
       - PaddingTableImage:
-          size: [ 480, 480 ]
+          size: [480, 480]
       - TableBoxEncode:
-          use_xywh: true
+          use_xywh: True
       - NormalizeImage:
           scale: 1./255.
-          mean: [ 0.5, 0.5, 0.5 ]
-          std: [ 0.5, 0.5, 0.5 ]
-          order: 'hwc'
-      - ToCHWImage:
+          mean: [0.5, 0.5, 0.5]
+          std: [0.5, 0.5, 0.5]
+          order: hwc
+      - ToCHWImage: null
       - KeepKeys:
-          keep_keys: [ 'image', 'structure', 'bboxes', 'bbox_masks','shape' ]
+          keep_keys: [image, structure, bboxes, bbox_masks, shape]
   loader:
     shuffle: False
     drop_last: False
-    batch_size_per_card: 2
-    num_workers: 8
+    batch_size_per_card: 10
+    num_workers: 8
\ No newline at end of file
diff --git a/doc/doc_ch/algorithm_det_fcenet.md b/doc/doc_ch/algorithm_det_fcenet.md
index bd2e7342..a70caa29 100644
--- a/doc/doc_ch/algorithm_det_fcenet.md
+++ b/doc/doc_ch/algorithm_det_fcenet.md
@@ -1,17 +1,15 @@
 # FCENet
 
-- [1. ç®—æ³•ç®€ä»‹](#1)
-- [2. çŽ¯å¢ƒé…ç½®](#2)
-- [3. æ¨¡åž‹è®ç»ƒã€è¯„ä¼°ã€é¢„æµ‹](#3)
-    - [3.1 è®ç»ƒ](#3-1)
-    - [3.2 è¯„ä¼°](#3-2)
-    - [3.3 é¢„æµ‹](#3-3)
-- [4. æŽ¨ç†éƒ¨ç½²](#4)
-    - [4.1 PythonæŽ¨ç†](#4-1)
-    - [4.2 C++æŽ¨ç†](#4-2)
-    - [4.3 ServingæœåŠ¡åŒ–éƒ¨ç½²](#4-3)
-    - [4.4 æ›´å¤šæŽ¨ç†éƒ¨ç½²](#4-4)
-- [5. FAQ](#5)
+- [1. ç®—æ³•ç®€ä»‹](#1-ç®—æ³•ç®€ä»‹)
+- [2. çŽ¯å¢ƒé…ç½®](#2-çŽ¯å¢ƒé…ç½®)
+- [3. æ¨¡åž‹è®ç»ƒã€è¯„ä¼°ã€é¢„æµ‹](#3-æ¨¡åž‹è®ç»ƒè¯„ä¼°é¢„æµ‹)
+- [4. æŽ¨ç†éƒ¨ç½²](#4-æŽ¨ç†éƒ¨ç½²)
+  - [4.1 PythonæŽ¨ç†](#41-pythonæŽ¨ç†)
+  - [4.2 C++æŽ¨ç†](#42-cæŽ¨ç†)
+  - [4.3 ServingæœåŠ¡åŒ–éƒ¨ç½²](#43-servingæœåŠ¡åŒ–éƒ¨ç½²)
+  - [4.4 æ›´å¤šæŽ¨ç†éƒ¨ç½²](#44-æ›´å¤šæŽ¨ç†éƒ¨ç½²)
+- [5. FAQ](#5-faq)
+- [å¼•ç”¨](#å¼•ç”¨)
 
 <a name="1"></a>
 ## 1. ç®—æ³•ç®€ä»‹
diff --git a/doc/doc_ch/algorithm_overview.md b/doc/doc_ch/algorithm_overview.md
index ef96f6ec..84af5fdc 100755
--- a/doc/doc_ch/algorithm_overview.md
+++ b/doc/doc_ch/algorithm_overview.md
@@ -1,9 +1,10 @@
 # OCRç®—æ³•
 
 - [1. ä¸¤é˜¶æ®µç®—æ³•](#1-ä¸¤é˜¶æ®µç®—æ³•)
-    - [1.1 æ–‡æœ¬æ£€æµ‹ç®—æ³•](#11-æ–‡æœ¬æ£€æµ‹ç®—æ³•)
-    - [1.2 æ–‡æœ¬è¯†åˆ«ç®—æ³•](#12-æ–‡æœ¬è¯†åˆ«ç®—æ³•)
+  - [1.1 æ–‡æœ¬æ£€æµ‹ç®—æ³•](#11-æ–‡æœ¬æ£€æµ‹ç®—æ³•)
+  - [1.2 æ–‡æœ¬è¯†åˆ«ç®—æ³•](#12-æ–‡æœ¬è¯†åˆ«ç®—æ³•)
 - [2. ç«¯åˆ°ç«¯ç®—æ³•](#2-ç«¯åˆ°ç«¯ç®—æ³•)
+- [3. è¡¨æ ¼è¯†åˆ«ç®—æ³•](#3-è¡¨æ ¼è¯†åˆ«ç®—æ³•)
 
 
 æœ¬æ–‡ç»™å‡ºäº†PaddleOCRå·²æ”¯æŒçš„OCRç®—æ³•åˆ—è¡¨ï¼Œä»¥åŠæ¯ä¸ªç®—æ³•åœ¨**è‹±æ–‡å…¬å¼€æ•°æ®é›†**ä¸Šçš„æ¨¡åž‹å’ŒæŒ‡æ ‡ï¼Œä¸»è¦ç”¨äºŽç®—æ³•ç®€ä»‹å’Œç®—æ³•æ€§èƒ½å¯¹æ¯”ï¼Œæ›´å¤šåŒ…æ‹¬ä¸æ–‡åœ¨å†…çš„å…¶ä»–æ•°æ®é›†ä¸Šçš„æ¨¡åž‹è¯·å‚è€ƒ[PP-OCR v2.0 ç³»åˆ—æ¨¡åž‹ä¸‹è½½](./models_list.md)ã€‚
@@ -96,3 +97,14 @@
 
 å·²æ”¯æŒçš„ç«¯åˆ°ç«¯OCRç®—æ³•åˆ—è¡¨ï¼ˆæˆ³é“¾æŽ¥èŽ·å–ä½¿ç”¨æ•™ç¨‹ï¼‰ï¼š
 - [x]  [PGNet](./algorithm_e2e_pgnet.md)
+
+## 3. è¡¨æ ¼è¯†åˆ«ç®—æ³•
+
+å·²æ”¯æŒçš„è¡¨æ ¼è¯†åˆ«ç®—æ³•åˆ—è¡¨ï¼ˆæˆ³é“¾æŽ¥èŽ·å–ä½¿ç”¨æ•™ç¨‹ï¼‰ï¼š
+- [x]  [TableMaster](./algorithm_table_master.md)
+
+åœ¨PubTabNetè¡¨æ ¼è¯†åˆ«å…¬å¼€æ•°æ®é›†ä¸Šï¼Œç®—æ³•æ•ˆæžœå¦‚ä¸‹ï¼š
+
+|æ¨¡åž‹|éª¨å¹²ç½‘ç»œ|é…ç½®æ–‡ä»¶|acc|ä¸‹è½½é“¾æŽ¥|
+|---|---|---|---|---|
+|TableMaster|TableResNetExtra|[configs/table/table_master.yml](../../configs/table/table_master.yml)|77.47%|[训练模型](https://paddleocr.bj.bcebos.com/ppstructure/models/tablemaster/table_structure_tablemaster_train.tar)/[推理模型](https://paddleocr.bj.bcebos.com/ppstructure/models/tablemaster/table_structure_tablemaster_infer.tar)|
diff --git a/doc/doc_ch/algorithm_table_master.md b/doc/doc_ch/algorithm_table_master.md
new file mode 100644
index 00000000..6bfd0f36
--- /dev/null
+++ b/doc/doc_ch/algorithm_table_master.md
@@ -0,0 +1,114 @@
+# è¡¨æ ¼è¯†åˆ«ç®—æ³•-TableMASTER
+
+- [1. ç®—æ³•ç®€ä»‹](#1-ç®—æ³•ç®€ä»‹)
+- [2. çŽ¯å¢ƒé…ç½®](#2-çŽ¯å¢ƒé…ç½®)
+- [3. æ¨¡åž‹è®ç»ƒã€è¯„ä¼°ã€é¢„æµ‹](#3-æ¨¡åž‹è®ç»ƒè¯„ä¼°é¢„æµ‹)
+- [4. æŽ¨ç†éƒ¨ç½²](#4-æŽ¨ç†éƒ¨ç½²)
+  - [4.1 PythonæŽ¨ç†](#41-pythonæŽ¨ç†)
+  - [4.2 C++æŽ¨ç†éƒ¨ç½²](#42-cæŽ¨ç†éƒ¨ç½²)
+  - [4.3 ServingæœåŠ¡åŒ–éƒ¨ç½²](#43-servingæœåŠ¡åŒ–éƒ¨ç½²)
+  - [4.4 æ›´å¤šæŽ¨ç†éƒ¨ç½²](#44-æ›´å¤šæŽ¨ç†éƒ¨ç½²)
+- [5. FAQ](#5-faq)
+- [å¼•ç”¨](#å¼•ç”¨)
+
+<a name="1"></a>
+## 1. ç®—æ³•ç®€ä»‹
+
+è®ºæ–‡ä¿¡æ¯ï¼š
+> [TableMaster: PINGAN-VCGROUP’S SOLUTION FOR ICDAR 2021 COMPETITION ON SCIENTIFIC LITERATURE PARSING TASK B: TABLE RECOGNITION TO HTML](https://arxiv.org/pdf/2105.01848.pdf)
+> Ye, Jiaquan and Qi, Xianbiao and He, Yelin and Chen, Yihao and Gu, Dengyi and Gao, Peng and Xiao, Rong
+> 2021
+
+åœ¨PubTabNetè¡¨æ ¼è¯†åˆ«å…¬å¼€æ•°æ®é›†ä¸Šï¼Œç®—æ³•å¤çŽ°æ•ˆæžœå¦‚ä¸‹ï¼š
+
+|æ¨¡åž‹|éª¨å¹²ç½‘ç»œ|é…ç½®æ–‡ä»¶|acc|ä¸‹è½½é“¾æŽ¥|
+| --- | --- | --- | --- | --- |
+|TableMaster|TableResNetExtra|[configs/table/table_master.yml](../../configs/table/table_master.yml)|77.47%|[è®ç»ƒæ¨¡åž‹](https://paddleocr.bj.bcebos.com/ppstructure/models/tablemaster/table_structure_tablemaster_train.tar)/[æŽ¨ç†æ¨¡åž‹](https://paddleocr.bj.bcebos.com/ppstructure/models/tablemaster/table_structure_tablemaster_infer.tar)|
+
+
+<a name="2"></a>
+## 2. çŽ¯å¢ƒé…ç½®
+è¯·å…ˆå‚è€ƒ[ã€Šè¿è¡ŒçŽ¯å¢ƒå‡†å¤‡ã€‹](./environment.md)é…ç½®PaddleOCRè¿è¡ŒçŽ¯å¢ƒï¼Œå‚è€ƒ[ã€Šé¡¹ç›®å…‹éš†ã€‹](./clone.md)å…‹éš†é¡¹ç›®ä»£ç ã€‚
+
+
+<a name="3"></a>
+## 3. æ¨¡åž‹è®ç»ƒã€è¯„ä¼°ã€é¢„æµ‹
+
+ä¸Šè¿°TableMasteræ¨¡åž‹ä½¿ç”¨PubTabNetè¡¨æ ¼è¯†åˆ«å…¬å¼€æ•°æ®é›†è®ç»ƒå¾—åˆ°ï¼Œæ•°æ®é›†ä¸‹è½½å¯å‚è€ƒ [table_datasets](./dataset/table_datasets.md)ã€‚
+
+æ•°æ®ä¸‹è½½å®ŒæˆåŽï¼Œè¯·å‚è€ƒ[æ–‡æœ¬è¯†åˆ«æ•™ç¨‹](./recognition.md)è¿›è¡Œè®ç»ƒã€‚PaddleOCRå¯¹ä»£ç è¿›è¡Œäº†æ¨¡å—åŒ–ï¼Œè®ç»ƒä¸åŒçš„æ¨¡åž‹åªéœ€è¦**æ›´æ¢é…ç½®æ–‡ä»¶**å³å¯ã€‚
+
+<a name="4"></a>
+## 4. æŽ¨ç†éƒ¨ç½²
+
+<a name="4-1"></a>
+### 4.1 PythonæŽ¨ç†
+é¦–å…ˆå°†è®ç»ƒå¾—åˆ°bestæ¨¡åž‹ï¼Œè½¬æ¢æˆinference modelã€‚ä»¥åŸºäºŽTableResNetExtraéª¨å¹²ç½‘ç»œï¼Œåœ¨PubTabNetæ•°æ®é›†è®ç»ƒçš„æ¨¡åž‹ä¸ºä¾‹([æ¨¡åž‹ä¸‹è½½åœ°å€](https://paddleocr.bj.bcebos.com/contribution/table_master.tar))ï¼Œå¯ä»¥ä½¿ç”¨å¦‚ä¸‹å‘½ä»¤è¿›è¡Œè½¬æ¢ï¼š
+
+```shell
+# æ³¨æ„å°†pretrained_modelçš„è·¯å¾„è®¾ç½®ä¸ºæœ¬åœ°è·¯å¾„ã€‚
+python3 tools/export_model.py -c configs/table/table_master.yml -o Global.pretrained_model=output/table_master/best_accuracy Global.save_inference_dir=./inference/table_master
+```
+
+**æ³¨æ„ï¼š**
+- å¦‚æžœæ‚¨æ˜¯åœ¨è‡ªå·±çš„æ•°æ®é›†ä¸Šè®ç»ƒçš„æ¨¡åž‹ï¼Œå¹¶ä¸”è°ƒæ•´äº†å—å…¸æ–‡ä»¶ï¼Œè¯·æ³¨æ„ä¿®æ”¹é…ç½®æ–‡ä»¶ä¸çš„`character_dict_path`æ˜¯å¦ä¸ºæ‰€æ£ç¡®çš„å—å…¸æ–‡ä»¶ã€‚
+
+è½¬æ¢æˆåŠŸåŽï¼Œåœ¨ç›®å½•ä¸‹æœ‰ä¸‰ä¸ªæ–‡ä»¶ï¼š
+```
+/inference/table_master/
+    â”œâ”€â”€ inference.pdiparams         # è¯†åˆ«inferenceæ¨¡åž‹çš„å‚æ•°æ–‡ä»¶
+    â”œâ”€â”€ inference.pdiparams.info    # è¯†åˆ«inferenceæ¨¡åž‹çš„å‚æ•°ä¿¡æ¯ï¼Œå¯å¿½ç•¥
+    â””â”€â”€ inference.pdmodel           # è¯†åˆ«inferenceæ¨¡åž‹çš„programæ–‡ä»¶
+```
+
+
+æ‰§è¡Œå¦‚ä¸‹å‘½ä»¤è¿›è¡Œæ¨¡åž‹æŽ¨ç†ï¼š
+
+```shell
+cd ppstructure/
+python3.7 table/predict_structure.py --table_model_dir=../output/table_master/table_structure_tablemaster_infer/ --table_algorithm=TableMaster --table_char_dict_path=../ppocr/utils/dict/table_master_structure_dict.txt --table_max_len=480 --image_dir=docs/table/table.jpg
+# é¢„æµ‹æ–‡ä»¶å¤¹ä¸‹æ‰€æœ‰å›¾åƒæ—¶ï¼Œå¯ä¿®æ”¹image_dirä¸ºæ–‡ä»¶å¤¹ï¼Œå¦‚ --image_dir='docs/table'ã€‚
+```
+
+æ‰§è¡Œå‘½ä»¤åŽï¼Œä¸Šé¢å›¾åƒçš„é¢„æµ‹ç»“æžœï¼ˆç»“æž„ä¿¡æ¯å’Œè¡¨æ ¼ä¸æ¯ä¸ªå•å…ƒæ ¼çš„åæ ‡ï¼‰ä¼šæ‰“å°åˆ°å±å¹•ä¸Šï¼ŒåŒæ—¶ä¼šä¿å˜å•å…ƒæ ¼åæ ‡çš„å¯è§†åŒ–ç»“æžœã€‚ç¤ºä¾‹å¦‚ä¸‹ï¼š
+ç»“æžœå¦‚ä¸‹ï¼š
+```shell
+[2022/06/16 13:06:54] ppocr INFO: result: ['<html>', '<body>', '<table>', '<thead>', '<tr>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '</tr>', '</thead>', '<tbody>', '<tr>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '</tr>', '<tr>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '</tr>', '<tr>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '</tr>', '<tr>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '</tr>', '<tr>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '</tr>', '<tr>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '</tr>', '<tr>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '</tr>', '<tr>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '</tr>', '<tr>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '</tr>', '<tr>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '</tr>', '<tr>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '</tr>', '<tr>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '</tr>', '<tr>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '</tr>', '<tr>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '</tr>', '<tr>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '</tr>', '</tbody>', '</table>', '</body>', '</html>'], [[72.17591094970703, 10.759100914001465, 60.29658508300781, 16.6805362701416], [161.85562133789062, 10.884308815002441, 14.9495210647583, 16.727018356323242], [277.79876708984375, 29.54340362548828, 31.490320205688477, 18.143272399902344],
+...
+[336.11724853515625, 280.3601989746094, 39.456939697265625, 18.121286392211914]]
+[2022/06/16 13:06:54] ppocr INFO: save vis result to ./output/table.jpg
+[2022/06/16 13:06:54] ppocr INFO: Predict time of docs/table/table.jpg: 17.36806297302246
+```
+
+**æ³¨æ„**ï¼š
+
+- TableMasteråœ¨æŽ¨ç†æ—¶æ¯”è¾ƒæ…¢ï¼Œå»ºè®®ä½¿ç”¨GPUè¿›è¡Œä½¿ç”¨ã€‚
+
+<a name="4-2"></a>
+### 4.2 C++æŽ¨ç†éƒ¨ç½²
+
+ç”±äºŽC++é¢„å¤„ç†åŽå¤„ç†è¿˜æœªæ”¯æŒTableMasterï¼Œæ‰€ä»¥æš‚æœªæ”¯æŒ
+
+<a name="4-3"></a>
+### 4.3 ServingæœåŠ¡åŒ–éƒ¨ç½²
+
+æš‚ä¸æ”¯æŒ
+
+<a name="4-4"></a>
+### 4.4 æ›´å¤šæŽ¨ç†éƒ¨ç½²
+
+æš‚ä¸æ”¯æŒ
+
+<a name="5"></a>
+## 5. FAQ
+
+## å¼•ç”¨
+
+```bibtex
+@article{ye2021pingan,
+  title={PingAn-VCGroup's Solution for ICDAR 2021 Competition on Scientific Literature Parsing Task B: Table Recognition to HTML},
+  author={Ye, Jiaquan and Qi, Xianbiao and He, Yelin and Chen, Yihao and Gu, Dengyi and Gao, Peng and Xiao, Rong},
+  journal={arXiv preprint arXiv:2105.01848},
+  year={2021}
+}
+```
diff --git a/doc/doc_en/algorithm_overview_en.md b/doc/doc_en/algorithm_overview_en.md
index bc96cdf2..cd277c74 100755
--- a/doc/doc_en/algorithm_overview_en.md
+++ b/doc/doc_en/algorithm_overview_en.md
@@ -4,6 +4,7 @@
   * [1.1 Text Detection Algorithms](#11)
   * [1.2 Text Recognition Algorithms](#12)
 - [2. End-to-end Algorithms](#2)
+- [3. Table Recognition Algorithms](#3)
 
 
 This tutorial lists the OCR algorithms supported by PaddleOCR, as well as the models and metrics of each algorithm on **English public datasets**. It is mainly used for algorithm introduction and algorithm performance comparison. For more models on other datasets including Chinese, please refer to [PP-OCR v2.0 models list](./models_list_en.md).
@@ -95,3 +96,15 @@ Refer to [DTRB](https://arxiv.org/abs/1904.01906), the training and evaluation r
 
 Supported end-to-end algorithms (Click the link to get the tutorial):
 - [x]  [PGNet](./algorithm_e2e_pgnet_en.md)
+
+<a name="3"></a>
+## 3. Table Recognition Algorithms
+
+Supported table recognition algorithms (Click the link to get the tutorial):
+- [x]  [TableMaster](./algorithm_table_master_en.md)
+
+On the PubTabNet dataset, the algorithm result is as follows:
+
+|Model|Backbone|Config|Acc|Download link|
+|---|---|---|---|---|
+|TableMaster|TableResNetExtra|[configs/table/table_master.yml](../../configs/table/table_master.yml)|77.47%|[train model](https://paddleocr.bj.bcebos.com/ppstructure/models/tablemaster/table_structure_tablemaster_train.tar)/[inference model](https://paddleocr.bj.bcebos.com/ppstructure/models/tablemaster/table_structure_tablemaster_infer.tar)|
diff --git a/doc/doc_en/algorithm_table_master_en.md b/doc/doc_en/algorithm_table_master_en.md
new file mode 100644
index 00000000..a557a609
--- /dev/null
+++ b/doc/doc_en/algorithm_table_master_en.md
@@ -0,0 +1,112 @@
+# Table Recognition Algorithm-TableMASTER
+
+- [1. Introduction](#1-introduction)
+- [2. Environment](#2-environment)
+- [3. Model Training / Evaluation / Prediction](#3-model-training--evaluation--prediction)
+- [4. Inference and Deployment](#4-inference-and-deployment)
+  - [4.1 Python Inference](#41-python-inference)
+  - [4.2 C++ Inference](#42-c-inference)
+  - [4.3 Serving](#43-serving)
+  - [4.4 More](#44-more)
+- [5. FAQ](#5-faq)
+- [Citation](#citation)
+
+<a name="1"></a>
+## 1. Introduction
+
+Paper:
+> [TableMaster: PINGAN-VCGROUP’S SOLUTION FOR ICDAR 2021 COMPETITION ON SCIENTIFIC LITERATURE PARSING TASK B: TABLE RECOGNITION TO HTML](https://arxiv.org/pdf/2105.01848.pdf)
+> Ye, Jiaquan and Qi, Xianbiao and He, Yelin and Chen, Yihao and Gu, Dengyi and Gao, Peng and Xiao, Rong
+> 2021
+
+
+On the PubTabNet public table recognition dataset, the reproduced accuracy is as follows:
+
+|Model|Backbone|Config|Acc|Download link|
+| --- | --- | --- | --- | --- |
+|TableMaster|TableResNetExtra|[configs/table/table_master.yml](../../configs/table/table_master.yml)|77.47%|[train model](https://paddleocr.bj.bcebos.com/ppstructure/models/tablemaster/table_structure_tablemaster_train.tar)/[inference model](https://paddleocr.bj.bcebos.com/ppstructure/models/tablemaster/table_structure_tablemaster_infer.tar)|
+
+
+<a name="2"></a>
+## 2. Environment
+Please refer to ["Environment Preparation"](./environment_en.md) to configure the PaddleOCR environment, and refer to ["Project Clone"](./clone_en.md) to clone the project code.
+
+
+<a name="3"></a>
+## 3. Model Training / Evaluation / Prediction
+
+The above TableMaster model is trained using the PubTabNet table recognition public dataset. For the download of the dataset, please refer to [table_datasets](./dataset/table_datasets_en.md).
+
+After the data download is complete, please refer to [Text Recognition Training Tutorial](./recognition_en.md) for training. PaddleOCR has modularized the code structure, so that you only need to **replace the configuration file** to train different models.
+
+
+<a name="4"></a>
+## 4. Inference and Deployment
+
+<a name="4-1"></a>
+### 4.1 Python Inference
+
+First, convert the model saved in the TableMaster table recognition training process into an inference model. Taking the model based on the TableResNetExtra backbone network and trained on the PubTabNet dataset as example ([model download link](https://paddleocr.bj.bcebos.com/contribution/table_master.tar)), you can use the following command to convert:
+
+
+```shell
+python3 tools/export_model.py -c configs/table/table_master.yml -o Global.pretrained_model=output/table_master/best_accuracy Global.save_inference_dir=./inference/table_master
+```
+
+**Note:**
+- If you trained the model on your own dataset and adjusted the dictionary file, make sure that `character_dict_path` in the configuration file points to the correct dictionary file.
+
+
+Execute the following command for model inference:
+
+```shell
+cd ppstructure/
+# When predicting all images in a folder, you can modify image_dir to a folder, such as --image_dir='docs/table'.
+python3.7 table/predict_structure.py --table_model_dir=../output/table_master/table_structure_tablemaster_infer/ --table_algorithm=TableMaster --table_char_dict_path=../ppocr/utils/dict/table_master_structure_dict.txt --table_max_len=480 --image_dir=docs/table/table.jpg
+
+```
+
+After executing the command, the prediction results of the above image (structural information and the coordinates of each cell in the table) are printed to the screen, and the visualization of the cell coordinates is also saved. An example is as follows:
+
+result:
+```shell
+[2022/06/16 13:06:54] ppocr INFO: result: ['<html>', '<body>', '<table>', '<thead>', '<tr>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '</tr>', '</thead>', '<tbody>', '<tr>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '</tr>', '<tr>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '</tr>', '<tr>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '</tr>', '<tr>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '</tr>', '<tr>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '</tr>', '<tr>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '</tr>', '<tr>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '</tr>', '<tr>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '</tr>', '<tr>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '</tr>', '<tr>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '</tr>', '<tr>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '</tr>', '<tr>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '</tr>', '<tr>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '</tr>', '<tr>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '</tr>', '<tr>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '<td></td>', '</tr>', '</tbody>', '</table>', '</body>', '</html>'], [[72.17591094970703, 10.759100914001465, 60.29658508300781, 16.6805362701416], [161.85562133789062, 10.884308815002441, 14.9495210647583, 16.727018356323242], [277.79876708984375, 29.54340362548828, 31.490320205688477, 18.143272399902344],
+...
+[336.11724853515625, 280.3601989746094, 39.456939697265625, 18.121286392211914]]
+[2022/06/16 13:06:54] ppocr INFO: save vis result to ./output/table.jpg
+[2022/06/16 13:06:54] ppocr INFO: Predict time of docs/table/table.jpg: 17.36806297302246
+```
+
+**Note**:
+
+- TableMaster is relatively slow during inference, so running it on a GPU is recommended.
+
+<a name="4-2"></a>
+### 4.2 C++ Inference
+
+Since the pre-processing and post-processing for TableMaster are not yet implemented in C++, C++ inference is not supported.
+
+
+<a name="4-3"></a>
+### 4.3 Serving
+
+Not supported
+
+<a name="4-4"></a>
+### 4.4 More
+
+Not supported
+
+<a name="5"></a>
+## 5. FAQ
+
+## Citation
+
+```bibtex
+@article{ye2021pingan,
+  title={PingAn-VCGroup's Solution for ICDAR 2021 Competition on Scientific Literature Parsing Task B: Table Recognition to HTML},
+  author={Ye, Jiaquan and Qi, Xianbiao and He, Yelin and Chen, Yihao and Gu, Dengyi and Gao, Peng and Xiao, Rong},
+  journal={arXiv preprint arXiv:2105.01848},
+  year={2021}
+}
+```
diff --git a/ppocr/data/imaug/label_ops.py b/ppocr/data/imaug/label_ops.py
index 00792701..96f3c986 100644
--- a/ppocr/data/imaug/label_ops.py
+++ b/ppocr/data/imaug/label_ops.py
@@ -670,6 +670,10 @@ class TableLabelEncode(AttnLabelEncode):
         return data
 
     def _merge_no_span_structure(self, structure):
+        """
+        This code is adapted from:
+        https://github.com/JiaquanYe/TableMASTER-mmocr/blob/master/table_recognition/data_preprocess.py
+        """
         new_structure = []
         i = 0
         while i < len(structure):
@@ -682,6 +686,11 @@ class TableLabelEncode(AttnLabelEncode):
         return new_structure
 
     def _replace_empty_cell_token(self, token_list, cells):
+        """
+        This code is adapted from:
+        https://github.com/JiaquanYe/TableMASTER-mmocr/blob/master/table_recognition/data_preprocess.py
+        """
+
         bbox_idx = 0
         add_empty_bbox_token_list = []
         for token in token_list:
diff --git a/ppocr/losses/table_master_loss.py b/ppocr/losses/table_master_loss.py
index 50a773dd..216c4e52 100644
--- a/ppocr/losses/table_master_loss.py
+++ b/ppocr/losses/table_master_loss.py
@@ -11,6 +11,11 @@
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
+"""
+This code is adapted from:
+https://github.com/JiaquanYe/TableMASTER-mmocr/tree/master/mmocr/models/textrecog/losses
+"""
+
 import paddle
 from paddle import nn
 
diff --git a/ppocr/modeling/backbones/table_master_resnet.py b/ppocr/modeling/backbones/table_master_resnet.py
index 82b4f37a..f1c506ca 100644
--- a/ppocr/modeling/backbones/table_master_resnet.py
+++ b/ppocr/modeling/backbones/table_master_resnet.py
@@ -11,6 +11,10 @@
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
+"""
+This code is adapted from:
+https://github.com/JiaquanYe/TableMASTER-mmocr/blob/master/mmocr/models/textrecog/backbones/table_resnet_extra.py
+"""
 
 import paddle
 import paddle.nn as nn
diff --git a/ppocr/modeling/heads/table_master_head.py b/ppocr/modeling/heads/table_master_head.py
index 4da6e9b5..887630a8 100644
--- a/ppocr/modeling/heads/table_master_head.py
+++ b/ppocr/modeling/heads/table_master_head.py
@@ -11,6 +11,11 @@
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
+"""
+This code is adapted from:
+https://github.com/JiaquanYe/TableMASTER-mmocr/blob/master/mmocr/models/textrecog/decoders/master_decoder.py
+"""
+
 import copy
 import math
 import paddle
diff --git a/ppocr/postprocess/__init__.py b/ppocr/postprocess/__init__.py
index 26a23f1e..1d414eb2 100644
--- a/ppocr/postprocess/__init__.py
+++ b/ppocr/postprocess/__init__.py
@@ -26,7 +26,7 @@ from .east_postprocess import EASTPostProcess
 from .sast_postprocess import SASTPostProcess
 from .fce_postprocess import FCEPostProcess
 from .rec_postprocess import CTCLabelDecode, AttnLabelDecode, SRNLabelDecode, \
-    DistillationCTCLabelDecode, TableLabelDecode, NRTRLabelDecode, SARLabelDecode, \
+    DistillationCTCLabelDecode, NRTRLabelDecode, SARLabelDecode, \
     SEEDLabelDecode, PRENLabelDecode, ViTSTRLabelDecode, ABINetLabelDecode
 from .cls_postprocess import ClsPostProcess
 from .pg_postprocess import PGPostProcess
diff --git a/ppstructure/docs/models_list.md b/ppstructure/docs/models_list.md
index dabce3a5..42d44009 100644
--- a/ppstructure/docs/models_list.md
+++ b/ppstructure/docs/models_list.md
@@ -35,7 +35,7 @@
 
 |æ¨¡åž‹åç§°|æ¨¡åž‹ç®€ä»‹|æŽ¨ç†æ¨¡åž‹å¤§å°|ä¸‹è½½åœ°å€|
 | --- | --- | --- | --- |
-|en_ppocr_mobile_v2.0_table_structure|PubLayNetæ•°æ®é›†è®ç»ƒçš„è‹±æ–‡è¡¨æ ¼åœºæ™¯çš„è¡¨æ ¼ç»“æž„é¢„æµ‹|18.6M|[æŽ¨ç†æ¨¡åž‹](https://paddleocr.bj.bcebos.com/dygraph_v2.0/table/en_ppocr_mobile_v2.0_table_structure_infer.tar) / [è®ç»ƒæ¨¡åž‹](https://paddleocr.bj.bcebos.com/dygraph_v2.1/table/en_ppocr_mobile_v2.0_table_structure_train.tar) |
+|en_ppocr_mobile_v2.0_table_structure|PubTabNetæ•°æ®é›†è®ç»ƒçš„è‹±æ–‡è¡¨æ ¼åœºæ™¯çš„è¡¨æ ¼ç»“æž„é¢„æµ‹|18.6M|[æŽ¨ç†æ¨¡åž‹](https://paddleocr.bj.bcebos.com/dygraph_v2.0/table/en_ppocr_mobile_v2.0_table_structure_infer.tar) / [è®ç»ƒæ¨¡åž‹](https://paddleocr.bj.bcebos.com/dygraph_v2.1/table/en_ppocr_mobile_v2.0_table_structure_train.tar) |
 
 <a name="3"></a>
 ## 3. VQAæ¨¡åž‹
-- 
GitLab