2 rokov pred · 65a4f20944
--- a/core/line_parser.py
+++ b/core/line_parser.py
@@ -0,0 +1,103 @@
 
				+import numpy as np
			
 
				+from dataclasses import dataclass
			
 
				+
			
 
				+# result 对象
			
 
				+@dataclass
			
 
				+class OcrResult(object):
			
 
				+    box: np.ndarray
			
 
				+    txt: str
			
 
				+    conf: float
			
 
				+
			
 
				+    def __hash__(self):
			
 
				+        return hash(repr(self))
			
 
				+
			
 
				+    def __repr__(self):
			
 
				+        return f'txt: {self.txt}, box: {self.box.tolist()}, conf: {self.conf}'
			
 
				+
			
 
				+    @property
			
 
				+    def lt(self):
			
 
				+        l, t = np.min(self.box, 0)
			
 
				+        return [l, t]
			
 
				+
			
 
				+    @property
			
 
				+    def rb(self):
			
 
				+        r, b = np.max(self.box, 0)
			
 
				+        return [r, b]
			
 
				+
			
 
				+    @property
			
 
				+    def wh(self):
			
 
				+        l, t = self.lt
			
 
				+        r, b = self.rb
			
 
				+        return [r - l, b - t]
			
 
				+
			
 
				+    def one_line(self, b, is_horizontal, eps: float = 20.0) -> bool:
			
 
				+        if is_horizontal:
			
 
				+            return abs(self.lt[1] - b.lt[1]) < eps
			
 
				+        else:
			
 
				+            return abs(self.rb[0] - b.rb[0]) < eps
			
 
				+
			
 
				+
			
 
				+# 行处理器
			
 
				+class LineParser(object):
			
 
				+    def __init__(self, ocr_raw_result):
			
 
				+        self.ocr_res = []
			
 
				+        for re in ocr_raw_result:
			
 
				+            o = OcrResult(np.array(re[0]), re[1][0], re[1][1])
			
 
				+            self.ocr_res.append(o)
			
 
				+        self.eps = self.avg_height * 0.66
			
 
				+
			
 
				+    @property
			
 
				+    def is_horizontal(self):
			
 
				+        res = self.ocr_res
			
 
				+        wh = np.stack([np.abs(np.array(r.lt) - np.array(r.rb)) for r in res])
			
 
				+        return np.sum(wh[:, 0] > wh[:, 1]) > np.sum(wh[:, 0] < wh[:, 1])
			
 
				+
			
 
				+    @property
			
 
				+    def avg_height(self):
			
 
				+        idx = self.is_horizontal + 0
			
 
				+        return np.mean(np.array([r.wh[idx] for r in self.ocr_res]))
			
 
				+
			
 
				+    @property
			
 
				+    def confidence(self):
			
 
				+        return np.mean([r.conf for r in self.ocr_res])
			
 
				+
			
 
				+    # 处理器函数
			
 
				+    def parse(self, eps=40.0):
			
 
				+        # 存返回值
			
 
				+        res = []
			
 
				+
			
 
				+        # 需要 处理的 OcrResult 对象  的长度
			
 
				+        length = len(self.ocr_res)
			
 
				+
			
 
				+        # 如果字段数 小于等于1 就抛出异常
			
 
				+        if length <= 1:
			
 
				+            raise Exception('无法识别')
			
 
				+
			
 
				+        # 遍历数组 并处理他
			
 
				+        for i in range(length):
			
 
				+            # 拿出 OcrResult对象的 第i值 -暂存-
			
 
				+            res_i = self.ocr_res[i]
			
 
				+
			
 
				+            # any：-> True
			
 
				+            #       -input: 可迭代对象   |   -output: bool
			
 
				+            #       -如果iterable的任何元素为true，则返回true。如果iterable为空，则返回false。 -与🚪-
			
 
				+            # map: -> [False, False, False, False, True, True, False, False]
			
 
				+            #       -input: (函数, 可迭代对象)     ｜    -output: 可迭代对象
			
 
				+            #       -把 res 喂给lambda --lambda返回True的值-->  输出 新的可迭代对象
			
 
				+
			
 
				+            # 这次的 res_i 之前已经在结果集中，就继续下一个
			
 
				+            if any(map(lambda x: res_i in x, res)): continue
			
 
				+
			
 
				+            # set() -> {}
			
 
				+            # 初始化一个集合 即-输出-
			
 
				+            res_row = set()
			
 
				+
			
 
				+            for j in range(i, length):
			
 
				+                res_j = self.ocr_res[j]
			
 
				+                if res_i.one_line(res_j, self.is_horizontal, self.eps):
			
 
				+                    # LineParser 对象  不可以直接加入字典
			
 
				+
			
 
				+                    res_row.add(res_j)
			
 
				+            res.append(res_row)
			
 
				+        idx = self.is_horizontal + 0
			
 
				+        return sorted([list(r) for r in res], key=lambda x: x[0].lt[idx])
			
--- a/core/ocr.py
+++ b/core/ocr.py
@@ -1,4 +1,6 @@
 
				 from dataclasses import dataclass
			
 
				+
			
 
				+from core.line_parser import LineParser
			
 
				 from core.parser import *
			
 
				 from core.direction import *
			
 
				 import numpy as np
			
@@ -15,13 +17,17 @@ class IdCardOcr:
 
				         txts, confs, result = self._ocr(image)
			
 
				         angle = self.angle_detector.detect_angle(image, result)
			
 
				 
			
 
				+        line_parser = LineParser(result)
			
 
				+        line_result = line_parser.parse()
			
 
				+        conf = line_parser.confidence
			
 
				+
			
 
				         if int(image_type) == 0:
			
 
				-            parser = FrontParser(txts, confs)
			
 
				+            parser = FrontParser(line_result)
			
 
				         elif int(image_type) == 1:
			
 
				-            parser = BackParser(txts, confs)
			
 
				+            parser = BackParser(line_result)
			
 
				         else:
			
 
				             raise Exception('无法识别')
			
 
				-        return self._post_process(angle, parser, image_type)
			
 
				+        return self._post_process(conf, angle, parser, image_type)
			
 
				 
			
 
				     def _pre_process(self, image) -> (np.ndarray, int):
			
 
				         angle = detect_angle(image)
			
@@ -50,9 +56,9 @@ class IdCardOcr:
 
				         # print("......................................")
			
 
				         return txts, confs, result
			
 
				 
			
 
				-    def _post_process(self, angle: int, parser: Parser, image_type: str):
			
 
				+    def _post_process(self, conf, angle: int, parser: Parser, image_type: str):
			
 
				         ocr_res = parser.parse()
			
 
				-        conf = parser.confidence
			
 
				+
			
 
				 
			
 
				         res = {
			
 
				             "confidence": conf,
			
--- a/core/parser.py
+++ b/core/parser.py
@@ -4,6 +4,9 @@ from dataclasses import dataclass
 
				 from collections import defaultdict
			
 
				 import numpy as np
			
 
				 import cpca
			
 
				+from typing import List
			
 
				+
			
 
				+from core.line_parser import OcrResult
			
 
				 
			
 
				 
			
 
				 @dataclass
			
@@ -16,10 +19,8 @@ class RecItem:
 
				 
			
 
				 
			
 
				 class Parser(object):
			
 
				-    def __init__(self, txts, confs):
			
 
				-        self.result = txts
			
 
				-        self.confs = confs
			
 
				-        assert len(self.result) == len(self.confs), 'result and confs do not match'
			
 
				+    def __init__(self, ocr_results: List[OcrResult]):
			
 
				+        self.result = ocr_results
			
 
				         self.res = defaultdict(RecItem)
			
 
				         self.keys = ["name", "id", "ethnicity", "gender", "birthday",
			
 
				                      "address", "address_province", "address_city", "address_region", "address_detail", "expire_date"]
			
@@ -30,254 +31,189 @@ class Parser(object):
 
				     def parse(self):
			
 
				         return self.res
			
 
				 
			
 
				-    @property
			
 
				-    def confidence(self):
			
 
				-        return 0.
			
 
				-
			
 
				 
			
 
				 class FrontParser(Parser):
			
 
				     """
			
 
				     """
			
 
				 
			
 
				-    def __init__(self, txts, confs):
			
 
				-        Parser.__init__(self, txts, confs)
			
 
				-        self.result = [
			
 
				-            i.replace(" ", "").translate(str.maketrans("", "", string.punctuation))
			
 
				-            for i in txts
			
 
				-        ]
			
 
				-        assert len(self.result) == len(self.confs), 'result and confs do not match'
			
 
				+    def __init__(self, ocr_results: List[OcrResult]):
			
 
				+        Parser.__init__(self, ocr_results)
			
 
				 
			
 
				     def birth(self):
			
 
				         if len(self.res["id"].text) == 18:
			
 
				             # 342423 2001  0  2    1  5    6552
			
 
				             # 012345 6789  10 11   12 13   14
			
 
				             str_num = self.res["id"].text
			
 
				-            date = list(str_num[6:10] + "年" + str_num[10:12] + "月" + str_num[12:14] + "日")
			
 
				-            if date[date.index("月") - 2] == "0":
			
 
				-                del date[date.index("月") - 2]
			
 
				-            if date[date.index("日") - 2] == "0":
			
 
				-                del date[date.index("日") - 2]
			
 
				-            self.res["birthday"].text = "".join(date)
			
 
				+            date = str_num[6:10] + "年" + str_num[10:12] + "月" + str_num[12:14] + "日"
			
 
				+            self.res["birthday"] = RecItem(date, self.res['id'].confidence)
			
 
				 
			
 
				     def card_no(self):
			
 
				         """
			
 
				         身份证号码
			
 
				         """
			
 
				-        for i in range(len(self.result)):
			
 
				-            txt = self.result[i]
			
 
				-
			
 
				-            # 身份证号码
			
 
				-            if "X" in txt or "x" in txt:
			
 
				-                res = re.findall("\d*[X|x]", txt)
			
 
				-            else:
			
 
				-                res = re.findall("\d{16,18}", txt)
			
 
				+        for idx, row in enumerate(self.result):
			
 
				+            for r in row:
			
 
				+                txt = r.txt
			
 
				 
			
 
				-            if len(res) > 0:
			
 
				-                if len(res[0]) == 18:
			
 
				-                    self.res["id"].text = res[0].replace("号码", "")
			
 
				-                    self.res["id"].confidence = self.confs[i]
			
 
				-                    self.res["gender"].text = "男" if int(res[0][16]) % 2 else "女"
			
 
				-                    self.res["gender"].confidence = self.confs[i]
			
 
				-                break
			
 
				-
			
 
				-    def full_name(self):
			
 
				-        """
			
 
				-        身份证姓名
			
 
				-        """
			
 
				-        for i in range(len(self.result)):
			
 
				-            txt = self.result[i]
			
 
				-            length = len(txt)
			
 
				-            if "姓名" in txt:
			
 
				-                if len(txt) < 7:
			
 
				-                    res = re.findall("姓名[\u4e00-\u9fa5]{1,4}", txt)
			
 
				-                    # 三个字名字
			
 
				-                    if len(res) > 0:
			
 
				-                        self.res["name"].text = res[0].split("姓名")[-1]
			
 
				-                        self.res["name"].confidence = self.confs[i]
			
 
				-                        self.result[i] = "temp"  # 避免身份证姓名对地址造成干扰
			
 
				-                        break
			
 
				+                # 身份证号码
			
 
				+                if "X" in txt or "x" in txt:
			
 
				+                    res = re.findall("\d*[X|x]", txt)
			
 
				                 else:
			
 
				-                    res = txt[2:]
			
 
				-                    name_list = []
			
 
				-                    point_unicode = ["\u2E31", "\u2218", "\u2219", "\u22C5", "\u25E6", "\u2981",
			
 
				-                                     "\u00B7", "\u0387", "\u05BC", "\u16EB", "\u2022", "\u2027",
			
 
				-                                     "\u2E30", "\uFF0E", "\u30FB", "\uFF65", "\u10101"]
			
 
				-                    for n in range(len(point_unicode)):
			
 
				-                        point = re.findall(point_unicode[n], res)
			
 
				-                        if len(point) != 0:
			
 
				-                            name_list = res.split(point[0])
			
 
				-                            for m in range(len(name_list)):
			
 
				-                                name_list[m] = name_list[m].replace(' ', '')
			
 
				-                            res = name_list[0] + '\u00B7' + name_list[1]
			
 
				-
			
 
				-                self.res["name"].text = res
			
 
				-                self.res["name"].confidence = self.confs[i]
			
 
				-                self.result[i] = "temp"  # 避免身份证姓名对地址造成干扰
			
 
				-
			
 
				-    def gender(self):
			
 
				+                    res = re.findall("\d{16,18}", txt)
			
 
				+
			
 
				+                if len(res) > 0:
			
 
				+                    if len(res[0]) == 18:
			
 
				+                        self.res["id"].text = res[0]
			
 
				+                        self.res["id"].confidence = r.conf
			
 
				+                        self.res["gender"].text = "男" if int(res[0][16]) % 2 else "女"
			
 
				+                        self.res["gender"].confidence = r.conf
			
 
				+                        if idx < 2:
			
 
				+                            self.result = self.result[idx + 1:]
			
 
				+                            self.result.reverse()
			
 
				+                        else:
			
 
				+                            self.result = self.result[:idx]
			
 
				+                    return
			
 
				+        raise Exception('无法识别')
			
 
				+
			
 
				+    def name(self):
			
 
				         """
			
 
				-        性别女民族汉
			
 
				+        姓名
			
 
				         """
			
 
				-        if len(self.res["gender"].text) != 0: return
			
 
				-        for i in range(len(self.result)):
			
 
				-            txt = self.result[i]
			
 
				-            if "男" in txt:
			
 
				-                self.res["gender"] = RecItem("男", self.confs[i])
			
 
				-                break
			
 
				 
			
 
				-            if "女" in txt:
			
 
				-                self.res["gender"] = RecItem("女", self.confs[i])
			
 
				-                break
			
 
				+        if len(self.result[0]) == 2:
			
 
				+            for r in self.result[0]:
			
 
				+                if '姓' in r.txt or ('名' in r.txt and len(r.txt) < 3):
			
 
				+                    continue
			
 
				+                else:
			
 
				+                    self.res['name'] = RecItem(r.txt, r.conf)
			
 
				+                    return
			
 
				+        if len(self.result[0]) == 1:
			
 
				+            txt = self.result[0][0].txt
			
 
				+            conf = self.result[0][0].conf
			
 
				+            if "姓名" in txt:
			
 
				+
			
 
				+                res = txt[2:]
			
 
				+                name_list = []
			
 
				+                point_unicode = ["\u2E31", "\u2218", "\u2219", "\u22C5", "\u25E6", "\u2981",
			
 
				+                                 "\u00B7", "\u0387", "\u05BC", "\u16EB", "\u2022", "\u2027",
			
 
				+                                 "\u2E30", "\uFF0E", "\u30FB", "\uFF65", "\u10101"]
			
 
				+                for n in range(len(point_unicode)):
			
 
				+                    point = re.findall(point_unicode[n], res)
			
 
				+                    if len(point) != 0:
			
 
				+                        name_list = res.split(point[0])
			
 
				+                        self.res['name'] = RecItem(name_list[0].replace('姓名') + '\u00B7' + name_list[1], conf)
			
 
				+                        return
			
 
				+
			
 
				+                res = re.findall("姓名[\u4e00-\u9fa5]{1,7}", txt)
			
 
				+                if len(res) > 0:
			
 
				+                    self.res["name"] = RecItem(res[0].split("姓名")[-1], conf)
			
 
				+                    return
			
 
				+        raise Exception('无法识别')
			
 
				 
			
 
				     def national(self):
			
 
				         # 性别女民族汉
			
 
				-        for i in range(len(self.result)):
			
 
				-            txt = self.result[i]
			
 
				+        if len(self.result[1]) == 1:
			
 
				+            txt = self.result[1][0].txt
			
 
				+            conf = self.result[1][0].conf
			
 
				             res = re.findall(".*民族[\u4e00-\u9fa5]+", txt)
			
 
				 
			
 
				             if len(res) > 0:
			
 
				-                self.res["ethnicity"] = RecItem(res[0].split("族")[-1], self.confs[i])
			
 
				-                break
			
 
				+                self.res["ethnicity"] = RecItem(res[0].split("族")[-1], conf)
			
 
				+                return
			
 
				 
			
 
				     def address(self):
			
 
				         """
			
 
				         身份证地址
			
 
				         """
			
 
				-        addString = []
			
 
				-        conf = []
			
 
				-        for i in range(len(self.result)):
			
 
				-            txt = self.result[i]
			
 
				-            txt = txt.replace("号码", "")
			
 
				-            if "公民" in txt:
			
 
				-                txt = "temp"
			
 
				-            # 身份证地址
			
 
				-
			
 
				-            if (
			
 
				-                    "住址" in txt
			
 
				-                    or "址" in txt
			
 
				-                    or "省" in txt
			
 
				-                    or "市" in txt
			
 
				-                    or "县" in txt
			
 
				-                    or "街" in txt
			
 
				-                    or "乡" in txt
			
 
				-                    or "村" in txt
			
 
				-                    or "镇" in txt
			
 
				-                    or "区" in txt
			
 
				-                    or "城" in txt
			
 
				-                    or "组" in txt
			
 
				-                    or "旗" in txt
			
 
				-                    or "号" in txt
			
 
				-            ):
			
 
				-                # if "住址" in txt or "省" in txt or "址" in txt:
			
 
				-                if "住址" in txt or "省" in txt or "址" in txt or \
			
 
				-                        ('市' in txt and len(addString) > 0 and '市' not in addString[0]):
			
 
				-                    addString.insert(0, txt.split("址")[-1])
			
 
				-                else:
			
 
				-                    addString.append(txt)
			
 
				-                conf.append(self.confs[i])
			
 
				-                self.result[i] = "temp"
			
 
				-        if len(addString) > 0:
			
 
				-            self.res["address"].text = "".join(addString)
			
 
				-            self.res["address"].confidence = np.mean(conf)
			
 
				-        # print(f'addr: {self.res["Address"]}')
			
 
				+        res = []
			
 
				+        confs = []
			
 
				 
			
 
				-    def split_addr(self):
			
 
				-        if self.res["address"].text:
			
 
				-            conf = self.res["address"].confidence
			
 
				-            df = cpca.transform([self.res["address"].text])
			
 
				-            # print(df)
			
 
				-
			
 
				-            province = df.iloc[0, 0]
			
 
				-            city = df.iloc[0, 1]
			
 
				-            region = df.iloc[0, 2]
			
 
				-            detail = df.iloc[0, 3]
			
 
				-            print(f'pronvince: {province}, city: {city}, region: {region}, detail: {detail}')
			
 
				-            self.res["address_province"] = RecItem(province, conf)
			
 
				-            self.res["address_city"] = RecItem(city, conf)
			
 
				-            if detail and "旗" in detail:
			
 
				-                temp_region = []
			
 
				-                temp_region.insert(0, detail.split("旗")[0] + "旗")
			
 
				-                self.res["address_region"] = RecItem(temp_region[0], conf)
			
 
				-                self.res["address_detail"] = RecItem(detail.split("旗")[-1], conf)
			
 
				-            else:
			
 
				-                self.res["address_region"] = RecItem(region, conf)
			
 
				-                self.res["address_detail"] = RecItem(detail, conf)
			
 
				+        for row in self.result[3:]:
			
 
				+            for r in row:
			
 
				+                txt = r.txt
			
 
				 
			
 
				-    def expire_date(self):
			
 
				-        for txt, conf in zip(self.result, self.confs):
			
 
				-            txt = txt.replace('.', '')
			
 
				-            res = re.findall('\d{8}\-\d{8}', txt)
			
 
				-            if res:
			
 
				-                self.res["expire_date"] = RecItem(res[0], conf)
			
 
				-                break
			
 
				-            res = re.findall('\d{8}\-长期', txt)
			
 
				-            if res:
			
 
				-                self.res["expire_date"] = RecItem(res[0], conf)
			
 
				-                break
			
 
				-
			
 
				-    def predict_name(self):
			
 
				-        """
			
 
				-        如果PaddleOCR返回的不是姓名xx连着的，则需要去猜测这个姓名，此处需要改进
			
 
				-        """
			
 
				-        if len(self.res['name'].text) > 1: return
			
 
				-        for i in range(len(self.result)):
			
 
				-            txt = self.result[i]
			
 
				-            if 1 < len(txt) < 5:
			
 
				                 if (
			
 
				-                        "性别" not in txt
			
 
				-                        and "姓名" not in txt
			
 
				-                        and "民族" not in txt
			
 
				-                        and "住址" not in txt
			
 
				-                        and "出生" not in txt
			
 
				-                        and "号码" not in txt
			
 
				-                        and "身份" not in txt
			
 
				+                        "住址" in txt
			
 
				+                        or "址" in txt
			
 
				+                        or "省" in txt
			
 
				+                        or "市" in txt
			
 
				+                        or "县" in txt
			
 
				+                        or "街" in txt
			
 
				+                        or "乡" in txt
			
 
				+                        or "村" in txt
			
 
				+                        or "镇" in txt
			
 
				+                        or "区" in txt
			
 
				+                        or "城" in txt
			
 
				+                        or "组" in txt
			
 
				+                        or "旗" in txt
			
 
				+                        or "号" in txt
			
 
				                 ):
			
 
				-                    result = re.findall("[\u4e00-\u9fa5]{2,4}", txt)
			
 
				-                    if len(result) > 0:
			
 
				-                        self.res["Name"] = RecItem(result[0], self.confs[i])
			
 
				-                        break
			
 
				+                    # if "住址" in txt or "省" in txt or "址" in txt:
			
 
				+                    if "住址" in txt or "址" in txt:
			
 
				+                        res.append(txt.split("址")[-1])
			
 
				+                    else:
			
 
				+                        res.append(txt)
			
 
				+                    confs.append(r.conf)
			
 
				+
			
 
				+        if len(res) > 0:
			
 
				+            self.res["address"] = RecItem("".join(res), np.mean(confs))
			
 
				+            self.split_addr()
			
 
				+            return
			
 
				+        raise Exception('无法识别')
			
 
				 
			
 
				-    @property
			
 
				-    def confidence(self):
			
 
				-        return np.mean(self.confs)
			
 
				+    def split_addr(self):
			
 
				+        conf = self.res["address"].confidence
			
 
				+        df = cpca.transform([self.res["address"].text])
			
 
				+        # print(df)
			
 
				+
			
 
				+        province = df.iloc[0, 0]
			
 
				+        city = df.iloc[0, 1]
			
 
				+        region = df.iloc[0, 2]
			
 
				+        detail = df.iloc[0, 3]
			
 
				+        print(f'pronvince: {province}, city: {city}, region: {region}, detail: {detail}')
			
 
				+        self.res["address_province"] = RecItem(province, conf)
			
 
				+        self.res["address_city"] = RecItem(city, conf)
			
 
				+        if detail and "旗" in detail:
			
 
				+            temp_region = []
			
 
				+            temp_region.insert(0, detail.split("旗")[0] + "旗")
			
 
				+            self.res["address_region"] = RecItem(temp_region[0], conf)
			
 
				+            self.res["address_detail"] = RecItem(detail.split("旗")[-1], conf)
			
 
				+        else:
			
 
				+            self.res["address_region"] = RecItem(region, conf)
			
 
				+            self.res["address_detail"] = RecItem(detail, conf)
			
 
				+        if not self.res['address_region'].text or not self.res['address_detail'].text:
			
 
				+            raise Exception('无法识别')
			
 
				 
			
 
				     def parse(self):
			
 
				-        self.full_name()
			
 
				-        self.national()
			
 
				         self.card_no()
			
 
				-        self.address()
			
 
				-        self.split_addr()
			
 
				+        self.name()
			
 
				+        self.national()
			
 
				         self.birth()
			
 
				-        self.gender()
			
 
				-        self.expire_date()
			
 
				-        self.predict_name()
			
 
				-        if not self.res["id"].text:
			
 
				-            raise Exception("没有识别到身份证号")
			
 
				+        self.address()
			
 
				         return {key: self.res[key].to_dict() for key in self.keys}
			
 
				 
			
 
				 
			
 
				 class BackParser(Parser):
			
 
				-    def __init__(self, txts, confs):
			
 
				-        Parser.__init__(self, txts, confs)
			
 
				+    def __init__(self, ocr_results: List[OcrResult]):
			
 
				+        Parser.__init__(self, ocr_results)
			
 
				 
			
 
				     def expire_date(self):
			
 
				-        for txt, conf in zip(self.result, self.confs):
			
 
				-            txt = txt.replace('.', '')
			
 
				-            res = re.findall('\d{8}\-\d{8}', txt)
			
 
				-            if res:
			
 
				-                self.res["expire_date"] = RecItem(res[0], conf)
			
 
				-                break
			
 
				-            res = re.findall('\d{8}\-长期', txt)
			
 
				-            if res:
			
 
				-                self.res["expire_date"] = RecItem(res[0], conf)
			
 
				-                break
			
 
				-
			
 
				-    @property
			
 
				-    def confidence(self):
			
 
				-        return np.mean(self.confs)
			
 
				+        for row in self.result:
			
 
				+            for r in row:
			
 
				+                txt = r.txt
			
 
				+                txt = txt.replace('.', '')
			
 
				+                res = re.findall('\d{8}\-\d{8}', txt)
			
 
				+                if res:
			
 
				+                    self.res["expire_date"] = RecItem(res[0], r.conf)
			
 
				+                    return
			
 
				+                res = re.findall('\d{8}\-长期', txt)
			
 
				+                if res:
			
 
				+                    self.res["expire_date"] = RecItem(res[0], r.conf)
			
 
				+                    return
			
 
				+        raise Exception('无法识别')
			
 
				 
			
 
				     def parse(self):
			
 
				         self.expire_date()
			
 
				         if not self.res["expire_date"].text:
			
 
				             raise Exception("无法识别")
			
 
				-        return {key: self.res[key].to_dict() for key in self.keys}
			
 
				+        return {key: self.res[key].to_dict() for key in self.keys}