2 gadi atpakaļ · 2c36bfc8d8
--- a/core/direction.py
+++ b/core/direction.py
@@ -3,6 +3,8 @@ from dataclasses import dataclass
 
				 from paddleocr import PaddleOCR
			
 
				 
			
 
				 import numpy as np
			
 
				+import imutils
			
 
				+import matplotlib.pyplot as plt
			
 
				 
			
 
				 
			
 
				 def detect_angle(result, ocr_anchor: OcrAnchor):
			
@@ -12,6 +14,7 @@ def detect_angle(result, ocr_anchor: OcrAnchor):
 
				     print(res)
			
 
				     print('------ angle ocr -------')
			
 
				     is_horizontal = lp.is_horizontal
			
 
				+    # rotate_angle = lp.is_need_rotate
			
 
				     return ocr_anchor.locate_anchor(res, is_horizontal)
			
 
				 
			
 
				 
			
@@ -33,14 +36,19 @@ class AngleDetector(object):
 
				         except Exception as e:
			
 
				             print("direction.py这里有异常。。。。。。")
			
 
				             print(e)
			
 
				-            # 如果第一次识别不到，旋转90度再识别
			
 
				-            img = cv2.rotate(img, cv2.ROTATE_90_CLOCKWISE)
			
 
				-            result = self.ocr.ocr(img, cls=True)
			
 
				+            # 如果第一次识别不到，再识别
			
 
				+            result = self.ocr.ocr(img, cls=False)
			
 
				             angle = detect_angle(result, ocr_anchor)
			
 
				             # 旋转90度之后要重新计算角度
			
 
				-            return (angle - 1 + 4) % 4, result
			
 
				+            # return (angle - 1 + 4) % 4, result
			
 
				+            return angle, result
			
 
				 
			
 
				     def origin_detect(self, img):
			
 
				         # 这边一般是在自己的检测模型result=[]时，再使用官方的模型做个检测，如果这个也没有结果，那就真的检测不出来
			
 
				         result = self.ocr.ocr(img)
			
 
				         return result
			
 
				+
			
 
				+    def det_oneline(self, result):
			
 
				+        # 这边已经是转正之后的图片，不需要考虑是否水平，只要检测是否一行
			
 
				+        lp = LineParser(result)
			
 
				+        return lp.detection_parse()
			
--- a/core/line_parser.py
+++ b/core/line_parser.py
@@ -1,5 +1,6 @@
 
				-from dataclasses import dataclass
			
 
				+import math
			
 
				 import numpy as np
			
 
				+from dataclasses import dataclass
			
 
				 
			
 
				 
			
 
				 # result 对象
			
@@ -31,6 +32,24 @@ class OcrResult(object):
 
				         r, b = self.rb
			
 
				         return [r - l, b - t]
			
 
				 
			
 
				+    @property
			
 
				+    def area(self):
			
 
				+        w, h = self.wh
			
 
				+        return w * h
			
 
				+
			
 
				+    @property
			
 
				+    def is_slope(self):
			
 
				+        """
			
 
				+        function: 10~60,-60~-10度之间，需要旋转图片，因为目前的检测模型对于倾斜角度的不能检测
			
 
				+        return: 需要旋转的角度 ---> tan
			
 
				+        """
			
 
				+        p0 = self.box[0]
			
 
				+        p1 = self.box[1]
			
 
				+        if p0[0] == p1[0]:  # 如果是正常的那就不用转
			
 
				+            return 0
			
 
				+        slope = 1. * (p1[1] - p0[1]) / (p1[0] - p0[0])
			
 
				+        return slope
			
 
				+
			
 
				     @property
			
 
				     def center(self):
			
 
				         l, t = self.lt
			
@@ -42,19 +61,31 @@ class OcrResult(object):
 
				         x_idx = 1 - y_idx
			
 
				         if b.lt[x_idx] < self.lt[x_idx] < self.rb[x_idx] < b.rb[x_idx]: return False
			
 
				         if self.lt[x_idx] < b.lt[x_idx] < b.rb[x_idx] < self.rb[x_idx]: return False
			
 
				-        eps = 0.5 * (self.wh[y_idx] + b.wh[y_idx])
			
 
				+        eps = 0.25 * (self.wh[y_idx] + b.wh[y_idx])
			
 
				         dist = abs(self.center[y_idx] - b.center[y_idx])
			
 
				         return dist < eps
			
 
				 
			
 
				 
			
 
				 # 行处理器
			
 
				 class LineParser(object):
			
 
				-    def __init__(self, ocr_raw_result):
			
 
				+    def __init__(self, ocr_raw_result, filters=None):
			
 
				+        # self.rotate_angle = 0
			
 
				+        if filters is None:
			
 
				+            filters = [lambda x: x.is_slope]
			
 
				         self.ocr_res = []
			
 
				         for re in ocr_raw_result:
			
 
				             o = OcrResult(np.array(re[0]), re[1][0], re[1][1])
			
 
				+            # if any([f(o) for f in filters]): continue
			
 
				             self.ocr_res.append(o)
			
 
				-        self.eps = self.avg_height * 0.66
			
 
				+        self.ocr_res = sorted(self.ocr_res, key=lambda x: x.area, reverse=True)
			
 
				+
			
 
				+        # 找到最大的检测框，大概率就是卡号所在位置
			
 
				+        # max_res = self.ocr_res[0]
			
 
				+        # for f in filters:
			
 
				+        #     k = f(max_res)
			
 
				+        #     self.rotate_angle = math.atan(k) * 180 / math.pi
			
 
				+
			
 
				+        self.eps = self.avg_height * 0.7
			
 
				 
			
 
				     @property
			
 
				     def is_horizontal(self):
			
@@ -62,11 +93,16 @@ class LineParser(object):
 
				         wh = np.stack([np.abs(np.array(r.lt) - np.array(r.rb)) for r in res])
			
 
				         return np.sum(wh[:, 0] > wh[:, 1]) > np.sum(wh[:, 0] < wh[:, 1])
			
 
				 
			
 
				+    # @property
			
 
				+    # def is_need_rotate(self):
			
 
				+    #     return self.rotate_angle
			
 
				+
			
 
				     @property
			
 
				     def avg_height(self):
			
 
				         idx = self.is_horizontal + 0
			
 
				         return np.mean(np.array([r.wh[idx] for r in self.ocr_res]))
			
 
				 
			
 
				+    # 整体置信度
			
 
				     @property
			
 
				     def confidence(self):
			
 
				         return np.mean([r.conf for r in self.ocr_res])
			
@@ -79,15 +115,12 @@ class LineParser(object):
 
				         # 需要 处理的 OcrResult 对象  的长度
			
 
				         length = len(self.ocr_res)
			
 
				 
			
 
				-        # 如果字段数 小于等于1 就抛出异常
			
 
				-        # if length <= 1:
			
 
				-        #     raise Exception('无法识别')
			
 
				-
			
 
				         # 遍历数组 并处理他
			
 
				         for i in range(length):
			
 
				             # 拿出 OcrResult对象的 第i值 -暂存-
			
 
				             res_i = self.ocr_res[i]
			
 
				 
			
 
				+            # 这次的 res_i 之前已经在结果集中，就继续下一个
			
 
				             if any(map(lambda x: res_i in x, res)): continue
			
 
				 
			
 
				             # set() -> {}
			
@@ -96,10 +129,20 @@ class LineParser(object):
 
				 
			
 
				             for j in range(i, length):
			
 
				                 res_j = self.ocr_res[j]
			
 
				+                # 这次的 res_i 之前已经在结果集中，就继续下一个
			
 
				+                if any(map(lambda x: res_j in x, res)): continue
			
 
				+
			
 
				                 if res_i.one_line(res_j, self.is_horizontal, self.eps):
			
 
				-                    if any(map(lambda x: res_j in x, res)): continue
			
 
				                     # LineParser 对象  不可以直接加入字典
			
 
				+
			
 
				                     res_row.add(res_j)
			
 
				             res.append(res_row)
			
 
				         idx = self.is_horizontal + 0
			
 
				-        return sorted([sorted(list(r), key=lambda x: x.lt[1 - idx]) for r in res], key=lambda x: x[0].lt[idx])
			
 
				+        res = sorted([sorted(list(r), key=lambda x: x.lt[1 - idx]) for r in res], key=lambda x: x[0].lt[idx])
			
 
				+
			
 
				+        return res
			
 
				+
			
 
				+    def detection_parse(self, eps=40.0):
			
 
				+        result = self.ocr_res
			
 
				+        if len(result) == 2:
			
 
				+            return result[0].one_line(result[1], True, self.eps)
			
--- a/core/ocr.py
+++ b/core/ocr.py
@@ -1,6 +1,8 @@
 
				 from dataclasses import dataclass
			
 
				 
			
 
				+import cv2
			
 
				 import numpy as np
			
 
				+import math
			
 
				 from paddleocr import PaddleOCR, draw_ocr
			
 
				 
			
 
				 from core.direction import *
			
@@ -20,7 +22,6 @@ class BankOcr:
 
				         print(f'---------- detect angle: {angle} 角度 --------')
			
 
				         # 这里使用自己训练的检测识别模型，在此之前，理想情况下，所有的银行卡的角度都已经是0，（正向）
			
 
				         _, _, result = self._ocr(image)
			
 
				-
			
 
				         # self.imshow(image, result)  # 将检测图片保存
			
 
				         return self._post_process(result, angle)
			
 
				 
			
@@ -38,13 +39,28 @@ class BankOcr:
 
				 
			
 
				         if angle == 1:
			
 
				             image = cv2.rotate(image, cv2.ROTATE_90_COUNTERCLOCKWISE)
			
 
				-        # print("检测出来的角度：", angle)  # 逆时针
			
 
				         if angle == 2:
			
 
				             image = cv2.rotate(image, cv2.ROTATE_180)
			
 
				         if angle == 3:
			
 
				             image = cv2.rotate(image, cv2.ROTATE_90_CLOCKWISE)
			
 
				 
			
 
				-        return image, angle, result
			
 
				+        # if -60 <= rotate_angle <= -20 or 20 <= rotate_angle <= 60:
			
 
				+        #     print("需要旋转角度")
			
 
				+        #     image = imutils.rotate(image, rotate_angle)
			
 
				+
			
 
				+        # 因为有些img像素过大，导致检测框效果不好，识别就会出问题
			
 
				+        h, w, _ = image.shape
			
 
				+        h_ratio = 1 if h <= 1000 else h / 1000
			
 
				+        w_ratio = 1 if w <= 1000 else w / 1000
			
 
				+
			
 
				+        if h_ratio == 1 and w_ratio == 1:
			
 
				+            return image, angle, result
			
 
				+        elif h_ratio != 1 or w_ratio != 1:
			
 
				+            ratio = h_ratio if h_ratio > w_ratio else w_ratio
			
 
				+            image = cv2.resize(image, (w // math.ceil(ratio), h // math.ceil(ratio)))
			
 
				+            print(image.shape)
			
 
				+
			
 
				+            return image, angle, result
			
 
				 
			
 
				     def _ocr(self, image):
			
 
				         # 获取模型检测结果,因为是正的照片了，所以不需要方向分类器
			
@@ -69,29 +85,64 @@ class BankOcr:
 
				         if result:
			
 
				             confs = [line[1][1] for line in result]
			
 
				             print("自己的检测模型得到的conf：", confs)
			
 
				-            if len(result) == 2 and all(map(lambda x: x > 0.975, confs)):
			
 
				-                l_box, r_box = [], []
			
 
				-                l_box.extend(result[0][0])
			
 
				-                r_box.extend(result[1][0])
			
 
				-
			
 
				-                l_max, _ = np.max(l_box, 0)
			
 
				-                r_min, _ = np.min(r_box, 0)
			
 
				 
			
 
				-                if l_max > r_min:
			
 
				-                    print("说明自己的检测模型不好")
			
 
				-                    result = self.angle_detector.origin_detect(image)
			
 
				-            else:
			
 
				-                # 一般情况下，len=1
			
 
				-                flag = 0
			
 
				-                if map(lambda x: x >= 0.975, confs):
			
 
				-                    flag = 1
			
 
				-                # for conf in confs:
			
 
				-                #     if conf >= 0.975:
			
 
				-                #         flag = 1
			
 
				-                #         break
			
 
				-                if flag == 0:
			
 
				-                    print("需要再次进行官方的检测代码。。。。。。。。。。。。")
			
 
				+            # 根绝len(result)分规则判断
			
 
				+            if len(result) == 1:
			
 
				+                if confs[0] > 0.987:
			
 
				+                    txts = [line[1][0] for line in result]
			
 
				+                    return txts, confs, result
			
 
				+                else:
			
 
				+                    print("len(result)=1时，再次用官方代码检测。。。。。。")
			
 
				                     result = self.angle_detector.origin_detect(image)
			
 
				+            elif len(result) == 2:
			
 
				+                # 1.判断两个检测框在不在一行
			
 
				+                is_oneline = self.angle_detector.det_oneline(result)
			
 
				+                # 2.如果不在一行
			
 
				+                if not is_oneline:
			
 
				+                    txts = [line[1][0] for line in result]
			
 
				+                    if not (any(map(lambda x: x > 0.987, confs)) and len(re.findall('\d{16,20}', txts)) > 0):
			
 
				+                        print("len(result)=2,但是不在一行。。。。。。")
			
 
				+                        result = self.angle_detector.origin_detect(image)
			
 
				+                # 3. 如果在一行
			
 
				+                elif is_oneline:
			
 
				+                    if all(map(lambda x: x > 0.987, confs)):
			
 
				+                        l_box, r_box = [], []
			
 
				+                        l_box.extend(result[0][0])
			
 
				+                        r_box.extend(result[1][0])
			
 
				+
			
 
				+                        l_max, _ = np.max(l_box, 0)
			
 
				+                        r_min, _ = np.min(r_box, 0)
			
 
				+
			
 
				+                        if l_max > r_min:
			
 
				+                            print("len(result)=2,在一行，但有重叠。。。。。。")
			
 
				+                            result = self.angle_detector.origin_detect(image)
			
 
				+                    else:
			
 
				+                        print("len(result)=2,在一行，但有一个检测不行。。。。。。")
			
 
				+                        result = self.angle_detector.origin_detect(image)
			
 
				+            elif len(result) > 2:
			
 
				+                print("len(result)=3,直接换官方检测。。。。。。")
			
 
				+                result = self.angle_detector.origin_detect(image)
			
 
				+
			
 
				+            # elif len(result) == 2 and all(map(lambda x: x > 0.975, confs)):
			
 
				+            #     l_box, r_box = [], []
			
 
				+            #     l_box.extend(result[0][0])
			
 
				+            #     r_box.extend(result[1][0])
			
 
				+            #
			
 
				+            #     l_max, _ = np.max(l_box, 0)
			
 
				+            #     r_min, _ = np.min(r_box, 0)
			
 
				+            #
			
 
				+            #     if l_max > r_min:
			
 
				+            #         print("说明自己的检测模型不好")
			
 
				+            #         result = self.angle_detector.origin_detect(image)
			
 
				+            # else:
			
 
				+            #     # 一般情况下，len=1
			
 
				+            #     flag = 0
			
 
				+            #     if all(map(lambda x: x >= 0.975, confs)):
			
 
				+            #         flag = 1
			
 
				+            #
			
 
				+            #     if flag == 0:
			
 
				+            #         print("需要再次进行官方的检测代码。。。。。。。。。。。。")
			
 
				+            #         result = self.angle_detector.origin_detect(image)
			
 
				 
			
 
				         # 如果还是空，那就检测不出来
			
 
				         if not result:
			
--- a/testing/true_test.py
+++ b/testing/true_test.py
@@ -1,74 +0,0 @@
 
				-import unittest
			
 
				-from pathlib import Path
			
 
				-
			
 
				-
			
 
				-from testing.utils import send_request
			
 
				-
			
 
				-
			
 
				-class TestBankCardOcr(unittest.TestCase):
			
 
				-
			
 
				-    def _helper(self, image_path, sta, orient, card_no):
			
 
				-        root = Path(__file__).parent
			
 
				-        image_path = str(root / image_path)
			
 
				-        r = send_request(image_path)
			
 
				-        self.assertEqual(sta, r['status'], f'{image_path} status case error')
			
 
				-        self.assertEqual(orient, r['result']['orientation'], f'{image_path} orientation case error')
			
 
				-        self.assertEqual(card_no, r['result']['number']['text'], f'{image_path} number case error')
			
 
				-
			
 
				-    def test_true_t01(self):
			
 
				-        image_path = '../images/ture/t01.png'
			
 
				-        self._helper(image_path, '000', 1, '6217002580007133039')
			
 
				-
			
 
				-    def test_true_t02(self):
			
 
				-        image_path = '../images/ture/t02.png'
			
 
				-        self._helper(image_path, '000', 0, '6217000410005833061')
			
 
				-
			
 
				-    def test_true_t03(self):
			
 
				-        image_path = '../images/ture/t03.png'
			
 
				-        self._helper(image_path, '000', 0, '6217000940023315733')
			
 
				-
			
 
				-    def test_true_t04(self):
			
 
				-        image_path = '../images/ture/t04.png'
			
 
				-        self._helper(image_path, '000', 1, '6214835665420657')
			
 
				-
			
 
				-    def test_true_t05(self):
			
 
				-        image_path = '../images/ture/t05.png'
			
 
				-        self._helper(image_path, '000', 0, '6217000780063553227')
			
 
				-
			
 
				-    # 以前正确，现在方向错误
			
 
				-    def test_true_t06(self):
			
 
				-        image_path = '../images/ture/t06.png'
			
 
				-        self._helper(image_path, '000', 0, '6230580000168512874')
			
 
				-
			
 
				-    def test_true_t07(self):
			
 
				-        image_path = '../images/ture/t07.png'
			
 
				-        self._helper(image_path, '000', 0, '6216618401001365345')
			
 
				-
			
 
				-    def test_true_t08(self):
			
 
				-        image_path = '../images/ture/t08.jpg'
			
 
				-        self._helper(image_path, '000', 0, '6217000416005548153')
			
 
				-
			
 
				-    def test_true_t09(self):
			
 
				-        image_path = '../images/ture/t09.jpg'
			
 
				-        self._helper(image_path, '000', 0, '6217000416005548146')
			
 
				-
			
 
				-    def test_true_t10(self):
			
 
				-        image_path = '../images/ture/t10.jpg'
			
 
				-        self._helper(image_path, '000', 0, '6217000416000737652')
			
 
				-
			
 
				-    def test_true_t11(self):
			
 
				-        image_path = '../images/ture/t11.png'
			
 
				-        self._helper(image_path, '000', 0, '6214834723639358')
			
 
				-
			
 
				-    def test_true_t12(self):
			
 
				-        image_path = '../images/ture/t12.jpg'
			
 
				-        self._helper(image_path, '000', 0, '6228480878204631674')
			
 
				-
			
 
				-    def test_true_05(self):
			
 
				-        image_path = '../images/ture/05.jpg'
			
 
				-        self._helper(image_path, '000', 0, '6217000416004473577')
			
 
				-
			
 
				-    def test_true_08(self):
			
 
				-        image_path = '../images/ture/08.png'
			
 
				-        self._helper(image_path, '000', 0, '6216618401001365345')
			
 
				-