新增火车票及身份证结构化识别

9a2924bd · lywen · 807f8828 · 9a2924bd · 9a2924bd · 9a2924bd
38 changed files
--- a/README.md
+++ b/README.md
@@ -4,7 +4,7 @@
 - [x]  文字方向检测 0、90、180、270度检测（支持dnn/tensorflow） 
 - [x]  支持(darknet/opencv dnn /keras)文字检测,暂时公布（keras版本训练）
 - [x]  不定长OCR训练(英文、中英文) crnn\dense ocr 
-
+- [x]  新增对身份证/火车票结构化数据识别

 ## 环境部署

@@ -45,11 +45,11 @@ ipython app.py 8080 ##8080端口号，可以设置任意端口

 ## 识别结果展示

-<img width="500" height="300" src="https://github.com/chineseocr/chineseocr/blob/master/test/img1.png"/>
-<img width="500" height="300" src="https://github.com/chineseocr/chineseocr/blob/master/test/4.png"/>
+<img width="500" height="300" src="https://github.com/chineseocr/chineseocr/blob/master/test/train1.png"/>
 <img width="500" height="300" src="https://github.com/chineseocr/chineseocr/blob/master/test/card1.png"/>
+<img width="500" height="300" src="https://github.com/chineseocr/chineseocr/blob/master/test/demo2.png"/>

-## Play with Docker Container
+## Play with Docker Container(镜像有些滞后)
 ``` Bash
 docker pull zergmk2/chineseocr
 docker run -d -p 8080:8080 zergmk2/chineseocr
@@ -58,7 +58,7 @@ docker run -d -p 8080:8080 zergmk2/chineseocr
 ## 访问服务
 http://127.0.0.1:8080/ocr

-<img width="500" height="300" src="https://github.com/chineseocr/chineseocr/blob/master/test/demo.png"/>
+<img width="500" height="300" src="https://github.com/chineseocr/chineseocr/blob/master/test/demo1.png"/>


 ## 参考

--- a/app.py
+++ b/app.py
@@ -13,6 +13,11 @@ web.config.debug  = True
 import model
 render = web.template.render('templates', base='base')
 from config import DETECTANGLE
+from apphelper.image import union_rbox
+from application import trainTicket,idcard 
+
+
+billList = ['通用OCR','火车票','身份证']

 class OCR:
    """通用OCR识别"""
@@ -25,11 +30,13 @@ class OCR:
        post['width'] = 600
        post['W'] = 600
        post['uuid'] = uuid.uuid1().__str__()
+        post['billList'] = billList
        return render.ocr(post)

    def POST(self):
        data = web.data()
        data = json.loads(data)
+        billModel = data.get('billModel','')
        imgString = data['imgString'].encode().split(b';base64,')[-1]
        imgString = base64.b64decode(imgString)
        jobid = uuid.uuid1().__str__()
@@ -58,13 +65,29 @@ class OCR:
                                    ifadjustDegree=False##是否先小角度调整文字倾斜角度
                                   )
        
+        
+        
+        if billModel=='' or billModel=='通用OCR' :
+            result = union_rbox(result,0.2)
+            res = [{'text':x['text'],'name':str(i)} for i,x in enumerate(result)]
+        elif billModel=='火车票':
+            res = trainTicket.trainTicket(result)
+            res = res.res
+            res =[ {'text':res[key],'name':key} for key in res]
+            
+        elif billModel=='身份证':
+            
+            res = idcard.idcard(result)
+            res = res.res
+            res =[ {'text':res[key],'name':key} for key in res]
+            
+        
        timeTake = time.time()-timeTake
-        res = map(lambda x:{'w':x['w'],'h':x['h'],'cx':x['cx'],'cy':x['cy'],'degree':x['degree'],'text':x['text']}, result)
-        res = list(res)
-
+         
+        
        os.remove(path)
        return json.dumps({'res':res,'timeTake':round(timeTake,4)},ensure_ascii=False)
-
+        




--- a/apphelper/image.py
+++ b/apphelper/image.py
@@ -525,3 +525,67 @@ def get_boxes( bboxes):
    return text_recs


+
+def union_rbox(result,alpha=0.1):
+    """
+    Merge rotated text boxes that sit on the same text line.
+
+    Boxes are consumed in the order given. A box joins the current (most
+    recent) group only if its normalised vertical distance to every box
+    already in that group is at most ``alpha``; otherwise it opens a new
+    group. Each group is then collapsed into a single box.
+
+    result: iterable of dicts with the keys 'cx', 'cy', 'w', 'h',
+            'degree' and 'text'.
+    alpha:  largest accepted value of |cy1-cy2| / min(h1/2, h2/2).
+
+    Returns a list of dicts with the keys 'text', 'cx', 'cy', 'w', 'h'
+    and 'degree', one per merged line (an empty list for empty input).
+    """
+    def diff(box1,box2):
+        """
+        Distance between the vertical centres of two boxes, relative to
+        half the height of the shorter box.
+        """
+        # Use BOTH heights; the 0.01 floor avoids dividing by zero for
+        # degenerate (zero-height) boxes.
+        half = min(box1['h']/2,box2['h']/2)
+        return abs(box1['cy']-box2['cy'])/max(0.01,half)
+
+    def sort_group_box(boxes):
+        """
+        Order the boxes of one line by 'cx', join their texts with a
+        single space and compute one box enclosing all of them.
+        """
+        boxes = sorted(boxes,key=lambda x:x['cx'])
+        text  = ' '.join([bx['text'] for bx in boxes])
+        # One row per box: x1,y1,x2,y2,x3,y3,x4,y4 as returned by
+        # xy_rotate_box (which takes the angle in radians here).
+        box4 = np.zeros((len(boxes),8))
+        for i,bx in enumerate(boxes):
+            box4[i] = xy_rotate_box(bx['cx'],bx['cy'],bx['w'],bx['h'],bx['degree']/180*np.pi)
+
+        # Extreme coordinates over all boxes of the group.
+        # NOTE(review): presumably corner order is top-left, top-right,
+        # bottom-right, bottom-left -- confirm against xy_rotate_box.
+        x1 = box4[:,0].min()
+        y1 = box4[:,1].min()
+        x2 = box4[:,2].max()
+        y2 = box4[:,3].min()
+        x3 = box4[:,4].max()
+        y3 = box4[:,5].max()
+        x4 = box4[:,6].min()
+        y4 = box4[:,7].max()
+        angle,w,h,cx,cy = solve([x1,y1,x2,y2,x3,y3,x4,y4])
+        # The angle from solve() is converted to degrees for the result.
+        return {'text':text,'cx':cx,'cy':cy,'w':w,'h':h,'degree':angle/np.pi*180}
+
+    newBox = []
+    for line in result:
+        # Join the last group only when the box is close to all members.
+        if newBox and all(diff(line,box)<=alpha for box in newBox[-1]):
+            newBox[-1].append(line)
+        else:
+            newBox.append([line])
+    return [sort_group_box(bx) for bx in newBox]
+            
+
--- a/static/css/.Rhistory
+++ b/static/css/.Rhistory
--- a/application/idcard.py
+++ b/application/idcard.py
+"""
+身份证
+"""
+from apphelper.image import union_rbox
+import re
+class idcard:
+    """
+    Structured recognition of an ID card.
+
+    The OCR boxes are merged line by line with union_rbox; every extractor
+    method then scans the merged lines and stores what it finds in
+    ``self.res`` (a dict keyed by the Chinese field names). A field that is
+    not found is simply absent from ``self.res``.
+    """
+    def __init__(self,result):
+        self.result = union_rbox(result,0.2)
+        self.N = len(self.result)
+        self.res = {}
+        self.full_name()
+        self.sex()
+        self.birthday()
+        self.birthNo()
+        self.address()
+
+    def _lines(self):
+        """
+        Yield the text of each merged line with all whitespace removed
+        (plain spaces as well as tabs, full-width and no-break spaces).
+        """
+        for box in self.result:
+            yield ''.join(box['text'].split())
+
+    def full_name(self):
+        """
+        Holder's name: one to four Chinese characters after the '姓名' label.
+        """
+        for txt in self._lines():
+            res = re.findall(r"姓名[\u4e00-\u9fa5]{1,4}",txt)
+            if res:
+                self.res['姓名'] = res[0].replace('姓名','')
+                break
+
+    def sex(self):
+        """
+        Gender and ethnicity, e.g. from a line reading "性别女民族汉".
+
+        The gender seen so far is only stored once a line carrying the
+        '民族' label followed by Chinese characters has been found.
+        """
+        sex={}
+        for txt in self._lines():
+            if '男' in txt:
+                sex["性别"] = '男'
+            elif '女' in txt:
+                sex["性别"] = '女'
+
+            res = re.findall(r".*民族[\u4e00-\u9fa5]+",txt)
+            if res:
+                sex["民族"] = res[0].split('民族')[-1]
+                self.res.update(sex)
+                break
+
+    def birthday(self):
+        """
+        Date of birth, stored as 'year-month-day'.
+        """
+        for txt in self._lines():
+            # Require digits in every part so a bare "年月日" cannot match.
+            res = re.findall(r'\d+年\d+月\d+日',txt)
+            if res:
+                self.res['出生年月'] = res[0].replace('年','-').replace('月','-').replace('日','')
+                break
+
+    def birthNo(self):
+        """
+        ID number.
+
+        Preferred source is the digits (optionally ending in X/x) right
+        after the '号码' label; otherwise any run of 16-18 characters made
+        of digits with an optional trailing X/x is taken.
+        """
+        for txt in self._lines():
+            # A label with no digits on the same line is skipped instead of
+            # producing an empty number and stopping the search.
+            found = re.search(r'号码(\d+[Xx]?)',txt) or re.search(r'(\d{15,17}[\dXx])',txt)
+            if found:
+                self.res['身份证号码'] = found.group(1)
+                break
+
+    def address(self):
+        """
+        Address: concatenation of every line that contains the '住址' label
+        or one of a few administrative-division characters.
+
+        TODO: this heuristic still needs refinement.
+        """
+        markers = ('住址','省','市','县','街','村','镇','区','城')
+        addString = [txt.replace('住址','')
+                     for txt in self._lines()
+                     if any(mark in txt for mark in markers)]
+        if addString:
+            self.res['身份证地址'] = ''.join(addString)
+                                
+        
\ No newline at end of file
--- a/application/trainTicket.py
+++ b/application/trainTicket.py
+"""
+火车票
+"""
+from apphelper.image import union_rbox
+import re
+class trainTicket:
+    """
+    Structured recognition of a train ticket.
+
+    The OCR boxes are merged line by line with union_rbox; every extractor
+    method then scans the merged lines and stores what it finds in
+    ``self.res`` (a dict keyed by the Chinese field names). A field that is
+    not found is simply absent from ``self.res``.
+    """
+    def __init__(self,result):
+        self.result = union_rbox(result,0.2)
+        self.N = len(self.result)
+        self.res = {}
+        self.station()
+        self.time()
+        self.price()
+        self.full_name()
+
+    def _lines(self):
+        """
+        Yield the text of each merged line with all whitespace removed
+        (plain spaces as well as tabs, full-width and no-break spaces).
+        """
+        for box in self.result:
+            yield ''.join(box['text'].split())
+
+    def station(self):
+        """
+        Departure station, arrival station and train number, taken from
+        a line such as "安顺站K492贵阳站".
+
+        The first line yielding any of these fields ends the search.
+        """
+        station={}
+        for txt in self._lines():
+            names = re.findall('[一-龥]+站',txt)
+            number = re.findall('[一-龥]+站(.+?)[][一-龥]+站',txt)
+            # Both stations are needed; a line with a single "...站" match
+            # used to raise IndexError here.
+            if len(names)>=2:
+                station['出发'] = names[0].replace('站','')
+                station['到达'] = names[1].replace('站','')
+            if number:
+                station['车次'] = number[0]
+
+            if station:
+                self.res.update(station)
+                break
+
+    def time(self):
+        """
+        Travel date (stored as 'year-month-day') and departure time.
+
+        The search stops at the first line holding both a date and a
+        clock time. If no line has both, the last date seen is still
+        stored on its own.
+        """
+        found={}
+        for txt in self._lines():
+            dates = re.findall('[0-9]{1,4}年[0-9]{1,2}月[0-9]{1,2}日',txt)
+            if not dates:
+                continue
+            found['日期'] = dates[0].replace('年','-').replace('月','-').replace('日','')
+            clocks = re.findall('[0-9]{1,2}:[0-9]{1,2}',txt)
+            if clocks:
+                found['时间'] = clocks[0]
+                break
+        if found:
+            self.res.update(found)
+
+    def price(self):
+        """
+        Ticket price with the currency sign and unit stripped.
+        """
+        # Tried in this order; the decimal point is matched literally.
+        patterns = (r'￥[0-9]{1,4}\.[0-9]{1,2}元',
+                    r'[0-9]{1,4}\.[0-9]{1,2}元',
+                    r'[0-9]{1,6}元',
+                    r'￥[0-9]{1,4}\.[0-9]{1,2}')
+        for txt in self._lines():
+            res = [hit for pattern in patterns for hit in re.findall(pattern,txt)]
+            if res:
+                self.res['车票价格'] = res[0].replace('￥','').replace('元','')
+                break
+
+    def full_name(self):
+        """
+        Passenger name: one to four Chinese characters that follow a
+        '*' (optionally surrounded by digits), as in a masked ID number.
+        """
+        for txt in self._lines():
+            res = re.findall(r"\d*\*\d*([一-龥]{1,4})",txt)
+            if res:
+                self.res['姓名'] = res[0]
+                # Stop at the first hit, like the other extractors.
+                break
+                
+                
+        
\ No newline at end of file
--- a/static/css/bootstrap.min.css
+++ b/static/css/bootstrap.min.css
--- a/static/css/zzsc.css
+++ b/static/css/zzsc.css
-/* DaTouWang URL: www.datouwang.com */
-body, html {font-family: "Microsoft YaHei","Segoe UI", "Lucida Grande", Helvetica, Arial,sans-serif; font-size: 100%; padding: 0; margin: 0;}
\ No newline at end of file
--- a/static/js/helps.js
+++ b/static/js/helps.js
@@ -5,10 +5,11 @@ function postImg(){
         if(imgJson['num']==0)
         {   loadingGif('loadingGif');
             imgJson['num']=1;//防止重复提交
+          //alert(imgJson["billModel"]);
         jQuery.ajax({
             type: "post",
             url: 'ocr',
-            data:JSON.stringify({"imgString":imgJson["imgString"]}),
+            data:JSON.stringify({"imgString":imgJson["imgString"],"billModel":imgJson["billModel"]}),
           success:function(d){
              loadingGif('loadingGif');
              imgJson['num']=0;//防止重复提交
@@ -116,7 +117,7 @@ function createTable(result,timeTake){
        var tableString =p+ "<table id='billmodeltable' class='gridtable'><tr><th>序号</th><th>值</th></tr>"
                        
        for(var i=0;i<jsObject.length;i++){
-            tableString+="<tr><td><p>"+i+"</p></td><td><p contenteditable='true'>"+jsObject[i]["text"]+"</p></td></tr>";
+            tableString+="<tr><td><p>"+jsObject[i]["name"]+"</p></td><td><p contenteditable='true'>"+jsObject[i]["text"]+"</p></td></tr>";
        }
        tableString+="</table>";
        //jQuery("#mytable").append(p);

--- a/templates/ocr.html
+++ b/templates/ocr.html
@@ -2,9 +2,7 @@ $def with(post)
 <script type="text/javascript" src="static/js/jquery.js"></script>   
 <script type="text/javascript" src="static/js/jquery.form.js"></script> 
 <script type="text/javascript" src="static/js/helps.js"></script> 
-<link rel="stylesheet" href="static/css/bootstrap.min.css">
-<link rel="stylesheet" type="static/css/css" href="css/zzsc.css">
- 
+
 <!-- CSS goes in the document HEAD or added to your external stylesheet -->
 <style type="text/css">
 table.gridtable {
@@ -56,6 +54,9 @@ imgJson = {"imgString":"",
 <div >
      <div class="image-input-container" style="position: absolute; left: 5%; top: 10%;">
                                    <input type="file"   id='imageButton'  accept="image/png, image/bmp, image/jpg, image/jpeg" class="image-local-input" onchange="FunimgPreview('imageButton','Preview','myCanvas')">
+                                    $for bill in post['billList']:
+                                        <div style="font-size:10px" class="class_div" onclick="getValue('$bill',this)"><a href="#" class="button"><span >$bill</span>/</a></div>
+                                    
                                    
      </div> 
 </div>
@@ -91,5 +92,17 @@ imgJson = {"imgString":"",
            jQuery('#imageButton').on('change', function()  
                      {  
                      });
+    
+    function getValue(value,that){
+        // Mark the clicked recognition type as selected: reset every
+        // "class_div" element to a white background, highlight the clicked
+        // one in pink, and remember the choice in imgJson.billModel.
+        var choices = document.getElementsByClassName("class_div");
+        Array.prototype.forEach.call(choices, function(node){
+            node.style.background = 'white';
+        });
+        that.style.background = 'pink';
+        imgJson.billModel = value;
+    }
+    
 </script> 

--- a/test.ipynb
+++ b/test.ipynb
--- a/test/4.png
+++ b/test/4.png
--- a/test/card1.png
+++ b/test/card1.png
--- a/test/demo.png
+++ b/test/demo.png
--- a/test/demo1.png
+++ b/test/demo1.png
--- a/test/demo2.png
+++ b/test/demo2.png
--- a/test/fbd49314175a9cd3252920c34a3c5d7d.jpeg
+++ b/test/fbd49314175a9cd3252920c34a3c5d7d.jpeg
--- a/test/img1.png
+++ b/test/img1.png
--- a/test/train.jpg
+++ b/test/train.jpg
--- a/test/train1.png
+++ b/test/train1.png
--- a/train/data/ocr/0/0.jpg
+++ b/train/data/ocr/0/0.jpg
--- a/train/data/ocr/0/0.txt
+++ b/train/data/ocr/0/0.txt
+Halal
\ No newline at end of file
--- a/train/data/ocr/0/1.jpg
+++ b/train/data/ocr/0/1.jpg
--- a/train/data/ocr/0/1.txt
+++ b/train/data/ocr/0/1.txt
+Flame
\ No newline at end of file
--- a/train/data/ocr/0/2.jpg
+++ b/train/data/ocr/0/2.jpg
--- a/train/data/ocr/0/2.txt
+++ b/train/data/ocr/0/2.txt
+Grilled
\ No newline at end of file
--- a/train/data/ocr/0/3.jpg
+++ b/train/data/ocr/0/3.jpg
--- a/train/data/ocr/0/3.txt
+++ b/train/data/ocr/0/3.txt
+Chicken
\ No newline at end of file
--- a/train/data/ocr/0/4.jpg
+++ b/train/data/ocr/0/4.jpg
--- a/train/data/ocr/0/4.txt
+++ b/train/data/ocr/0/4.txt
+I.Dammam:
\ No newline at end of file
--- a/train/data/ocr/0/5.jpg
+++ b/train/data/ocr/0/5.jpg
--- a/train/data/ocr/0/5.txt
+++ b/train/data/ocr/0/5.txt
+0138171856
\ No newline at end of file
--- a/train/data/ocr/0/6.jpg
+++ b/train/data/ocr/0/6.jpg
--- a/train/data/ocr/0/6.txt
+++ b/train/data/ocr/0/6.txt
+I-Khobar
\ No newline at end of file
--- a/train/data/ocr/0/7.jpg
+++ b/train/data/ocr/0/7.jpg
--- a/train/data/ocr/0/7.txt
+++ b/train/data/ocr/0/7.txt
+LG
\ No newline at end of file
--- a/train/text/26BB94CA21C11AB38BC5FC2E08D140CD.jpg
+++ b/train/text/26BB94CA21C11AB38BC5FC2E08D140CD.jpg
--- a/train/text/text-train.ipynb
+++ b/train/text/text-train.ipynb
@@ -233,7 +233,7 @@
   "metadata": {},
   "outputs": [],
   "source": [
-    "a,b,newBoxes = show(jpgPath[100])\n"
+    "a,b,newBoxes = show(jpgPath[9])\n"
   ]
  },
  {
@@ -402,7 +402,25 @@
   "metadata": {},
   "outputs": [],
   "source": [
-    "img = np.array(Image.open(jpgPath[76]))\n",
+    "p='./train/text/26BB94CA21C11AB38BC5FC2E08D140CD.jpg'"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "IMGSIZE=416,416"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "img = np.array(Image.open(p))\n",
    "box,scores = text_detect(img,prob = 0.01)\n",
    "plot_box(img,box)"
   ]