2 år sedan · 5b1a2188fc
--- a/.gitignore
+++ b/.gitignore
@@ -3,4 +3,5 @@
 
				 .DS_Store
			
 
				 __pycache__
			
 
				 *.pyc
			
 
				-output/
			
 
				+output/
			
 
				+/images/test
			
--- a/Dockerfile
+++ b/Dockerfile
@@ -97,6 +97,9 @@ environment=PYTHONUNBUFFERED=1\n\
 
				 ARG VERSION
			
 
				 ENV USE_CUDA $VERSION
			
 
				 Add . /workspace
			
 
				+RUN cp predict_det.py /opt/conda/envs/py38/lib/python3.8/site-packages/paddleocr/tools/infer/predict_det.py
			
 
				+RUN cp utility.py /opt/conda/envs/py38/lib/python3.8/site-packages/paddleocr/tools/infer/utility.py
			
 
				+
			
 
				 EXPOSE 8080
			
 
				 
			
 
				 
			
--- a/bank_det_infer/inference.pdiparams
+++ b/bank_det_infer/inference.pdiparams
--- a/bank_det_infer/inference.pdiparams.info
+++ b/bank_det_infer/inference.pdiparams.info
--- a/bank_det_infer/inference.pdmodel
+++ b/bank_det_infer/inference.pdmodel
--- a/bank_rec_infer/inference.pdiparams
+++ b/bank_rec_infer/inference.pdiparams
--- a/bank_rec_infer/inference.pdiparams.info
+++ b/bank_rec_infer/inference.pdiparams.info
--- a/bank_rec_infer/inference.pdmodel
+++ b/bank_rec_infer/inference.pdmodel
--- a/convert_markdown.py
+++ b/convert_markdown.py
@@ -0,0 +1,120 @@
 
				+import operator
			
 
				+from pathlib import Path
			
 
				+
			
 
				+import numpy as np
			
 
				+from mdutils.mdutils import MdUtils
			
 
				+import cv2
			
 
				+import requests
			
 
				+import json
			
 
				+import time
			
 
				+import base64
			
 
				+from itertools import chain
			
 
				+
			
 
# Base URL of the OCR service under test; send_request() appends the endpoint path.
url = 'http://192.168.199.249:28811'
# url = "http://aihub-test.digitalyili.com/aiSquare/openApi/reasoning-services/rlocrxm/xxw/schoolcert"
# Directory that contains this script; image paths are resolved against it.
root = Path(__file__).parent
# Markdown report builder; the file name is today's month-day followed by "银行卡".
mdFile = MdUtils(file_name=time.strftime("%m-%d", time.localtime()) + "银行卡")

print(root)
			
 
				+
			
 
				+
			
 
				+def send_request(img_path, image_type=0, rotate=None):
			
 
				+    # sourcery skip: use-fstring-for-concatenation
			
 
				+    # or_img
			
 
				+    # 创建存旋转照片的目录
			
 
				+    dir = img_path.parent.parent / (".ro_dir")
			
 
				+    if not dir.exists(): dir.mkdir()
			
 
				+
			
 
				+    # 旋转文件存文件
			
 
				+    #   - 读文件
			
 
				+    img = cv2.imread(str(img_path))
			
 
				+    img = cv2.cvtColor(img, cv2.COLOR_BGR2RGB)
			
 
				+    #   - 旋转保存文件
			
 
				+    # if rotate is not None:
			
 
				+    #     img = cv2.rotate(img, rotate)
			
 
				+    #
			
 
				+    #     angle = "_" + str(rotate + 1)
			
 
				+    #     img_path = dir / (img_path.stem + angle + ".jpg")
			
 
				+    #     img = cv2.cvtColor(img, cv2.COLOR_BGR2RGB)
			
 
				+    #     cv2.imwrite(str(img_path), img)
			
 
				+
			
 
				+    with img_path.open('rb') as f:
			
 
				+        img_str: str = base64.encodebytes(f.read()).decode('utf-8')
			
 
				+
			
 
				+    # request
			
 
				+    # headers = {
			
 
				+    #     'Authorization': "Bearer 9679c2b3-b90b-4029-a3c7-f347b4d242f7",
			
 
				+    #     'content-type': "application/json"
			
 
				+    # }
			
 
				+    # r = requests.post(url, json={"image": img_str, "image_type": image_type}, headers=headers)
			
 
				+
			
 
				+    r = requests.post(url + '/ocr_system/bankcard', json={"image": img_str, "image_type": image_type})
			
 
				+
			
 
				+
			
 
				+    print(r.json())
			
 
				+    return r.json(), img_path
			
 
				+
			
 
				+
			
 
				+def _parse_result(r):
			
 
				+    if r['status'] == '000':
			
 
				+        r = r['result']
			
 
				+        del r['confidence']
			
 
				+        return {k: v['text'] if isinstance(v, dict) else v for k, v in r.items()}
			
 
				+    elif r['status'] == '101':
			
 
				+        return r['msg']
			
 
				+
			
 
				+
			
 
				+
			
 
				+def compare_dic(dic, dic1, mdimg_path):
			
 
				+    global true_num
			
 
				+    image = mdFile.new_inline_image(text='', path=mdimg_path)
			
 
				+    if operator.eq(dic, dic1):
			
 
				+        true_list.extend([image, dic1])
			
 
				+    elif type(dic1) == dict:
			
 
				+        err_str = ""
			
 
				+        for key in dic:
			
 
				+            if dic[key] != dic1[key]:
			
 
				+                err_str = f"{err_str}正确:{dic[key]}<br>返回:{dic1[key]}<br>"
			
 
				+                true_num = true_num - 1
			
 
				+        false_list.extend([image, err_str])
			
 
				+    elif type(dic1) == str:
			
 
				+        false_list.extend([image, dic1])
			
 
				+
			
 
				+
			
 
				+if __name__ == '__main__':
			
 
				+    true_list = ["图片", "识别结果"]
			
 
				+    false_list = ["图片", "识别结果"]
			
 
				+
			
 
				+    # img_paths = chain(*[Path('./images/test/7.28/0').rglob('*.jpg')])
			
 
				+    img_paths = list(chain(*[Path('./images/test/7.28/0').rglob('*.jpg')]))
			
 
				+    true_num = all_num = 2 * len(img_paths)
			
 
				+    # 文件夹里每个图片
			
 
				+    for img_path in img_paths:
			
 
				+        print(img_path)
			
 
				+
			
 
				+        # 打开该图片的json文件
			
 
				+        imgj_path_d = img_path.parent
			
 
				+        imgj_path_n = f'{img_path.stem}.json'
			
 
				+        imgj_path = imgj_path_d / imgj_path_n
			
 
				+        with imgj_path.open('r') as json_f:
			
 
				+            dic_j = json.load(json_f)
			
 
				+
			
 
				+        # 四个方向
			
 
				+        # for (oor, cv2_orr) in {0: None, 1: 0, 2: 1, 3: 2}.items():
			
 
				+        #     r, path = send_request(root / img_path, 0, cv2_orr)
			
 
				+        #     dic_pic = _parse_result(r)
			
 
				+        #     dic_j['orientation'] = oor
			
 
				+        #     compare_dic(dic_j, dic_pic, str(path))
			
 
				+        r, path = send_request(root / img_path, 0, 0)
			
 
				+        dic_pic = _parse_result(r)
			
 
				+        compare_dic(dic_j, dic_pic, str(path))
			
 
				+
			
 
				+    mdFile.new_header(level=1, title='测试正确率')
			
 
				+    mdFile.new_paragraph("{:.2f}%".format(true_num / all_num * 100))
			
 
				+    mdFile.new_header(level=1, title='True')
			
 
				+    mdFile.new_table(columns=2, rows=len(true_list) // 2, text=true_list, text_align='center')
			
 
				+
			
 
				+    mdFile.new_header(level=1, title='False')
			
 
				+    mdFile.new_table(columns=2, rows=len(false_list) // 2, text=false_list, text_align='center')
			
 
				+
			
 
				+    mdFile.create_md_file()
			
--- a/core/anchor.py
+++ b/core/anchor.py
@@ -71,7 +71,7 @@ class OcrAnchor(object):
 
				         return (l + r) / 2, (t + b) / 2
			
 
				 
			
 
				     # 判断是否是 锚点
			
 
    def is_anchor(self, txt, box, conf) -> bool:
        """Decide whether one OCR fragment is this anchor.

        The base implementation is a stub that does nothing and therefore
        returns ``None``; subclasses such as ``BankCardAnchor`` override it.

        Args:
            txt: Recognised text of the fragment.
            box: Bounding box of the fragment.
            conf: Recognition confidence of the fragment.
        """
        pass
			
 
				 
			
 
				     # 找 锚点 -> 锚点坐标
			
@@ -83,10 +83,22 @@ class OcrAnchor(object):
 
				             for r in row:
			
 
				                 txt = r.txt.replace('-', '').replace(' ', '')
			
 
				                 box = r.box
			
 
				-                if self.is_anchor(txt, box):
			
 
				+                conf = r.conf
			
 
				+                flag = self.is_anchor(txt, box, conf)
			
 
				+                if flag:
			
 
				                     l, t = np.min(box, 0)
			
 
				                     r, b = np.max(box, 0)
			
 
				                     return True, (l + r) / 2, (t + b) / 2
			
 
				+        #         if flag and (len(re.findall('\d{10,20}', txt)) > 0 and conf > 0.95):
			
 
				+        #             l, t = np.min(box, 0)
			
 
				+        #             r, b = np.max(box, 0)
			
 
				+        #             return True, (l + r) / 2, (t + b) / 2
			
 
				+        #         elif flag:
			
 
				+        #             l, t = np.min(box, 0)
			
 
				+        #             r, b = np.max(box, 0)
			
 
				+        # if l:
			
 
				+        #     return True, (l + r) / 2, (t + b) / 2
			
 
				+        # else:
			
 
				         return False, 0., 0.
			
 
				 
			
 
				     # 定位 锚点 -> 角度
			
@@ -97,8 +109,6 @@ class OcrAnchor(object):
 
				         # 如果识别不到身份证号
			
 
				         if not found: raise Exception(f'识别不到anchor{self.name}')
			
 
				         cx, cy = self.get_rec_area(res)
			
 
				-        # print(f'id_cx: {id_cx}, id_cy: {id_cy}')
			
 
				-        # print(f'cx: {cx}, cy: {cy}')
			
 
				         pre = None
			
 
				         for d in self.direction:
			
 
				             f = self.direction_funcs.get(d, None)
			
@@ -115,10 +125,28 @@ class BankCardAnchor(OcrAnchor):
 
				     def __init__(self, name: str, d: List[Direction]):
			
 
				         super(BankCardAnchor, self).__init__(name, d)
			
 
				 
			
 
    def is_anchor(self, txt, box, conf) -> bool:
        """Return True when the fragment is confident enough to act as the anchor.

        Args:
            txt: Recognised text of the fragment (not used by the decision).
            box: Bounding box of the fragment (not used by the decision).
            conf: Recognition confidence of the fragment.

        Returns:
            ``True`` if ``conf`` is above 0.95, otherwise ``False``.
        """
        # The former cascade of digit-count regex checks (16-20, 10-16, 6-10,
        # 4-6 digits) returned True in every branch exactly when conf > 0.95
        # and ended in a bare `conf > 0.95` branch, so the text never affected
        # the result. The rule is stated directly here, which also drops the
        # invalid "\d" escapes of the non-raw pattern strings.
        # NOTE(review): if a digit run is meant to be required, add that check
        # here explicitly - TODO confirm the intended rule.
        return bool(conf > 0.95)
			
 
				 
			
 
				     def locate_anchor(self, res, is_horizontal) -> int:
			
--- a/core/direction.py
+++ b/core/direction.py
@@ -24,7 +24,6 @@ class AngleDetector(object):
 
				 
			
 
				     def detect_angle(self, img):
			
 
				         ocr_anchor = BankCardAnchor('银行卡号', [Direction.BOTTOM])
			
 
				-
			
 
				         result = self.ocr.ocr(img, cls=True)
			
 
				 
			
 
				         try:
			
@@ -32,6 +31,7 @@ class AngleDetector(object):
 
				             return angle, result
			
 
				 
			
 
				         except Exception as e:
			
 
				+            print("direction.py这里有异常。。。。。。")
			
 
				             print(e)
			
 
				             # 如果第一次识别不到，旋转90度再识别
			
 
				             img = cv2.rotate(img, cv2.ROTATE_90_CLOCKWISE)
			
@@ -39,3 +39,8 @@ class AngleDetector(object):
 
				             angle = detect_angle(result, ocr_anchor)
			
 
				             # 旋转90度之后要重新计算角度
			
 
				             return (angle - 1 + 4) % 4, result
			
 
				+
			
 
    def origin_detect(self, img):
        """Run ``self.ocr.ocr`` on ``img`` with its default options and return the result.

        Used as a second attempt when the custom detection model gives an
        empty result; if this is empty too, nothing could be detected.
        """
        return self.ocr.ocr(img)
			
--- a/core/line_parser.py
+++ b/core/line_parser.py
@@ -1,6 +1,7 @@
 
				 from dataclasses import dataclass
			
 
				 import numpy as np
			
 
				 
			
 
				+
			
 
				 # result 对象
			
 
				 @dataclass
			
 
				 class OcrResult(object):
			
@@ -45,6 +46,7 @@ class OcrResult(object):
 
				         dist = abs(self.center[y_idx] - b.center[y_idx])
			
 
				         return dist < eps
			
 
				 
			
 
				+
			
 
				 # 行处理器
			
 
				 class LineParser(object):
			
 
				     def __init__(self, ocr_raw_result):
			
@@ -78,8 +80,8 @@ class LineParser(object):
 
				         length = len(self.ocr_res)
			
 
				 
			
 
				         # 如果字段数 小于等于1 就抛出异常
			
 
				-        if length <= 1:
			
 
				-            raise Exception('无法识别')
			
 
				+        # if length <= 1:
			
 
				+        #     raise Exception('无法识别')
			
 
				 
			
 
				         # 遍历数组 并处理他
			
 
				         for i in range(length):
			
@@ -100,4 +102,4 @@ class LineParser(object):
 
				                     res_row.add(res_j)
			
 
				             res.append(res_row)
			
 
				         idx = self.is_horizontal + 0
			
 
				-        return sorted([sorted(list(r), key=lambda x: x.lt[1-idx]) for r in res], key=lambda x: x[0].lt[idx])
			
 
				+        return sorted([sorted(list(r), key=lambda x: x.lt[1 - idx]) for r in res], key=lambda x: x[0].lt[idx])
			
--- a/core/ocr.py
+++ b/core/ocr.py
@@ -1,12 +1,14 @@
 
				 from dataclasses import dataclass
			
 
				 
			
 
				 import numpy as np
			
 
				-from paddleocr import PaddleOCR
			
 
				+from paddleocr import PaddleOCR, draw_ocr
			
 
				 
			
 
				 from core.direction import *
			
 
				 from core.line_parser import LineParser
			
 
				 from core.parser import *
			
 
				 
			
 
				+from PIL import Image
			
 
				+
			
 
				 
			
 
				 @dataclass
			
 
				 class BankOcr:
			
@@ -14,19 +16,29 @@ class BankOcr:
 
				     angle_detector: AngleDetector
			
 
				 
			
 
				     def predict(self, image: np.ndarray):
			
 
				-        image, angle, result = self._pre_process(image)
			
 
				+        image, angle, ori_result = self._pre_process(image)
			
 
				         print(f'---------- detect angle: {angle} 角度 --------')
			
 
				-        if angle != 0:
			
 
				-            # 角度不为0需要重新识别,字面
			
 
				-            _, _, result = self._ocr(image)
			
 
				+        # 这里使用自己训练的检测识别模型，在此之前，理想情况下，所有的银行卡的角度都已经是0，（正向）
			
 
				+        _, _, result = self._ocr(image)
			
 
				+
			
 
				+        # self.imshow(image, result)  # 将检测图片保存
			
 
				         return self._post_process(result, angle)
			
 
				 
			
 
    def imshow(self, image, result):
        """Draw the OCR boxes, texts and scores on ``image`` and save it to ``./img.jpg``.

        Args:
            image: Array passed to ``Image.fromarray``.
            result: OCR lines; each line is indexed as ``line[0]`` (box),
                ``line[1][0]`` (text) and ``line[1][1]`` (score).
        """
        canvas = Image.fromarray(image).convert("RGB")

        boxes, txts, scores = [], [], []
        for line in result:
            recognised = line[1]
            boxes.append(line[0])
            txts.append(recognised[0])
            scores.append(recognised[1])

        annotated = draw_ocr(canvas, boxes, txts, scores, font_path="./simfang.ttf")
        Image.fromarray(annotated).save("./img.jpg")
			
 
				+
			
 
				     def _pre_process(self, image: np.ndarray):
			
 
				         angle, result = self.angle_detector.detect_angle(image)
			
 
				 
			
 
				         if angle == 1:
			
 
				             image = cv2.rotate(image, cv2.ROTATE_90_COUNTERCLOCKWISE)
			
 
				-        print(angle)  # 逆时针
			
 
				+        # print("检测出来的角度：", angle)  # 逆时针
			
 
				         if angle == 2:
			
 
				             image = cv2.rotate(image, cv2.ROTATE_180)
			
 
				         if angle == 3:
			
@@ -35,20 +47,62 @@ class BankOcr:
 
				         return image, angle, result
			
 
				 
			
 
				     def _ocr(self, image):
			
 
				-        # 获取模型检测结果
			
 
				-        result = self.ocr.ocr(image, cls=True)
			
 
				+        # 获取模型检测结果,因为是正的照片了，所以不需要方向分类器
			
 
				+        result = self.ocr.ocr(image, cls=False)
			
 
				         print("------------------")
			
 
				-        print(result)
			
 
				+        print("result:", result)
			
 
				+        print("------------------")
			
 
				+
			
 
				+        # result=[] 就用官方再检测
			
 
				         if not result:
			
 
				-            raise Exception('无法识别')
			
 
				-        confs = [line[1][1] for line in result]
			
 
				+            print("需要再次进行官方的检测代码。。。。。。。。。。。。")
			
 
				+            result = self.angle_detector.origin_detect(image)
			
 
				+            # 如果还是空，那就检测不出来
			
 
				+            if not result:
			
 
				+                raise Exception('经过两次检测都无法识别！！！')
			
 
				+
			
 
				+            confs = [line[1][1] for line in result]
			
 
				+            txts = [line[1][0] for line in result]
			
 
				+            return txts, confs, result
			
 
				 
			
 
				+        # result!=[] 就判断一些规则
			
 
				+        if result:
			
 
				+            confs = [line[1][1] for line in result]
			
 
				+            print("自己的检测模型得到的conf：", confs)
			
 
				+            if len(result) == 2 and all(map(lambda x: x > 0.975, confs)):
			
 
				+                l_box, r_box = [], []
			
 
				+                l_box.extend(result[0][0])
			
 
				+                r_box.extend(result[1][0])
			
 
				+
			
 
				+                l_max, _ = np.max(l_box, 0)
			
 
				+                r_min, _ = np.min(r_box, 0)
			
 
				+
			
 
				+                if l_max > r_min:
			
 
				+                    print("说明自己的检测模型不好")
			
 
				+                    result = self.angle_detector.origin_detect(image)
			
 
				+            else:
			
 
				+                # 一般情况下，len=1
			
 
				+                flag = 0
			
 
				+                if map(lambda x: x >= 0.975, confs):
			
 
				+                    flag = 1
			
 
				+                # for conf in confs:
			
 
				+                #     if conf >= 0.975:
			
 
				+                #         flag = 1
			
 
				+                #         break
			
 
				+                if flag == 0:
			
 
				+                    print("需要再次进行官方的检测代码。。。。。。。。。。。。")
			
 
				+                    result = self.angle_detector.origin_detect(image)
			
 
				+
			
 
				+        # 如果还是空，那就检测不出来
			
 
				+        if not result:
			
 
				+            raise Exception('经过两次检测都无法识别！！！')
			
 
				+
			
 
				+        confs = [line[1][1] for line in result]
			
 
				         # 将检测到的文字放到一个列表中
			
 
				         txts = [line[1][0] for line in result]
			
 
				         return txts, confs, result
			
 
				 
			
 
				     def _post_process(self, raw_result, angle: int):
			
 
				-
			
 
				         # 把测试图片 喂给 OCR 返回给 self.raw_results
			
 
				         line_parser = LineParser(raw_result)
			
 
				         line_results = line_parser.parse()
			
--- a/core/parser.py
+++ b/core/parser.py
@@ -19,49 +19,39 @@ class RecItem:
 
				 
			
 
				 
			
 
				 def find_card_row(line_results):
			
 
				-    res = None
			
 
				+    print('~~~~line results~~~~~')
			
 
				     for row in line_results:
			
 
				-        row = sorted(row, key=lambda x: x.lt[0])
			
 
				-        txt = [r.txt.replace(' ', '').replace('.', '') for r in row]
			
 
				+        print('++++')
			
 
				+        print(row)
			
 
				+    print('~~~~line results~~~~~')
			
 
				+
			
 
				+    new_lines = []
			
 
				+    for row in line_results:
			
 
				+        new_line = []
			
 
				+        for r in row:
			
 
				+            if r.conf > 0.93:
			
 
				+                new_line.append(r)
			
 
				+        if new_line:
			
 
				+            new_lines.append(new_line)
			
 
				+
			
 
				+    print('~~~~new line results~~~~~')
			
 
				+    for row in new_lines:
			
 
				+        print('++++')
			
 
				+        print(row)
			
 
				+    print('~~~~new line results~~~~~')
			
 
				+    line_results = new_lines
			
 
				+
			
 
				+    for row in line_results:
			
 
				+        txt = [r.txt.replace(' ', '') for r in row]
			
 
				         conf = np.mean([r.conf for r in row])
			
 
				-        lts = [r.lt for r in row]
			
 
				-        rbs = [r.rb for r in row]
			
 
				-        lt = np.min(np.stack(lts), 0)
			
 
				-        rb = np.max(np.stack(rbs), 0)
			
 
				         txt = ''.join(txt)
			
 
				         res = re.findall('\d{15,20}', txt)
			
 
				-        if res:
			
 
				-            return row, res[0], conf, lt.astype(np.int).tolist(), rb.astype(np.int).tolist()
			
 
				-    if not res:
			
 
				-        res_lt, res_rb = None, None
			
 
				-        row_res = 0
			
 
				-        max_w, max_h = 0, 0
			
 
				-        conf_res = 0.
			
 
				-        for row in line_results:
			
 
				-            txt = ''.join([r.txt.replace(' ', '').replace('.', '') for r in row])
			
 
				-            conf = np.mean([r.conf for r in row])
			
 
				-            print(txt)
			
 
				-            if not txt.isascii(): continue
			
 
				-            lts = [r.lt for r in row]
			
 
				-            rbs = [r.rb for r in row]
			
 
				-            lt = np.min(np.stack(lts), 0)
			
 
				-            rb = np.max(np.stack(rbs), 0)
			
 
				-            print(lt, rb, '-------')
			
 
				-            w, h = (rb - lt).astype(np.int).tolist()
			
 
				-            print(w, h, '-------')
			
 
				-            if w > max_w:
			
 
				-                row_res = row
			
 
				-                max_w, max_h = w, h
			
 
				-                res_lt, res_rb = lt, rb
			
 
				-                conf_res = conf
			
 
				-        res = re.findall('\d{15,20}', txt)
			
 
				-        if res:
			
 
				-            return row_res, txt, conf_res, res_lt.astype(np.int).tolist(), res_rb.astype(np.int).tolist()
			
 
				-        else:
			
 
				-            print('无法识别', txt)
			
 
				-
			
 
				+        print(f'res: {res}, conf: {conf}')
			
 
				+        if res and conf > 0.95:
			
 
				+            return row, res[0], conf
			
 
				     raise Exception('无法识别')
			
 
				 
			
 
				+
			
 
				 def handle_wrong_digits(s):
			
 
				     s = s.replace(' ', '')
			
 
				     s = s.replace('-', '')
			
@@ -74,6 +64,7 @@ def handle_wrong_digits(s):
 
				         s = '6' + s[1:]
			
 
				     return s
			
 
				 
			
 
				+
			
 
				 class Parser(object):
			
 
				     def __init__(self, line_results: List[List[OcrResult]]):
			
 
				         self.line_results = line_results
			
@@ -82,13 +73,11 @@ class Parser(object):
 
				 
			
 
				     def bank_no(self):
			
 
				         # 号码
			
 
				-        row, txt, conf, lt, rb = find_card_row(self.line_results)
			
 
				+        row, txt, conf = find_card_row(self.line_results)
			
 
				         print(f'=== txt: {txt}, res: {row}======')
			
 
				         txt = handle_wrong_digits(txt)
			
 
				         self.res['number'] = RecItem(txt, conf)
			
 
				 
			
 
				-
			
 
				-
			
 
    def parse(self):
        """Run the card-number extraction and return the collected ``self.res``."""
        self.bank_no()
        return self.res
			
--- a/cpu.Dockerfile
+++ b/cpu.Dockerfile
@@ -95,6 +95,9 @@ stdout_logfile_maxbytes=0\n\
 
				 ARG VERSION
			
 
				 ENV USE_CUDA $VERSION
			
 
				 Add . /workspace
			
 
				+RUN cp predict_det.py /opt/conda/envs/py38/lib/python3.8/site-packages/paddleocr/tools/infer/predict_det.py
			
 
				+RUN cp utility.py /opt/conda/envs/py38/lib/python3.8/site-packages/paddleocr/tools/infer/utility.py
			
 
				+
			
 
				 EXPOSE 8080
			
 
				 
			
 
				 
			
--- a/docker-compose.yml
+++ b/docker-compose.yml
@@ -10,12 +10,12 @@ services:
 
				     tty: true
			
 
				     working_dir: /workspace
			
 
				     ports:
			
 
				-      - '18081:8080'
			
 
				-      - '18223:22'
			
 
				+      - '28811:8080'
			
 
				+      - '222:22'
			
 
				     volumes:
			
 
				       - ./:/workspace
			
 
				-    deploy:
			
 
				-      resources:
			
 
				-        reservations:
			
 
				-          devices:
			
 
				-            - capabilities: [gpu]
			
 
				+#    deploy:
			
 
				+#      resources:
			
 
				+#        reservations:
			
 
				+#          devices:
			
 
				+#            - capabilities: [gpu]
			
--- a/en_dict.txt
+++ b/en_dict.txt
@@ -0,0 +1,95 @@
 
				+0
			
 
				+1
			
 
				+2
			
 
				+3
			
 
				+4
			
 
				+5
			
 
				+6
			
 
				+7
			
 
				+8
			
 
				+9
			
 
				+:
			
 
				+;
			
 
				+<
			
 
				+=
			
 
				+>
			
 
				+?
			
 
				+@
			
 
				+A
			
 
				+B
			
 
				+C
			
 
				+D
			
 
				+E
			
 
				+F
			
 
				+G
			
 
				+H
			
 
				+I
			
 
				+J
			
 
				+K
			
 
				+L
			
 
				+M
			
 
				+N
			
 
				+O
			
 
				+P
			
 
				+Q
			
 
				+R
			
 
				+S
			
 
				+T
			
 
				+U
			
 
				+V
			
 
				+W
			
 
				+X
			
 
				+Y
			
 
				+Z
			
 
				+[
			
 
				+\
			
 
				+]
			
 
				+^
			
 
				+_
			
 
				+`
			
 
				+a
			
 
				+b
			
 
				+c
			
 
				+d
			
 
				+e
			
 
				+f
			
 
				+g
			
 
				+h
			
 
				+i
			
 
				+j
			
 
				+k
			
 
				+l
			
 
				+m
			
 
				+n
			
 
				+o
			
 
				+p
			
 
				+q
			
 
				+r
			
 
				+s
			
 
				+t
			
 
				+u
			
 
				+v
			
 
				+w
			
 
				+x
			
 
				+y
			
 
				+z
			
 
				+{
			
 
				+|
			
 
				+}
			
 
				+~
			
 
				+!
			
 
				+"
			
 
				+#
			
 
				+$
			
 
				+%
			
 
				+&
			
 
				+'
			
 
				+(
			
 
				+)
			
 
				+*
			
 
				++
			
 
				+,
			
 
				+-
			
 
				+.
			
 
				+/
			
 
				+ 
			
--- a/ppocr_keys_bank.txt
+++ b/ppocr_keys_bank.txt
@@ -7,4 +7,4 @@
 
				 6
			
 
				 7
			
 
				 8
			
 
				-9
			
 
				+9
			
--- a/predict_det.py
+++ b/predict_det.py
@@ -0,0 +1,303 @@
 
				+# Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.
			
 
				+#
			
 
				+# Licensed under the Apache License, Version 2.0 (the "License");
			
 
				+# you may not use this file except in compliance with the License.
			
 
				+# You may obtain a copy of the License at
			
 
				+#
			
 
				+#     http://www.apache.org/licenses/LICENSE-2.0
			
 
				+#
			
 
				+# Unless required by applicable law or agreed to in writing, software
			
 
				+# distributed under the License is distributed on an "AS IS" BASIS,
			
 
				+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
			
 
				+# See the License for the specific language governing permissions and
			
 
				+# limitations under the License.
			
 
				+import os
			
 
				+import sys
			
 
				+
			
 
				+__dir__ = os.path.dirname(os.path.abspath(__file__))
			
 
				+sys.path.append(__dir__)
			
 
				+sys.path.insert(0, os.path.abspath(os.path.join(__dir__, '../..')))
			
 
				+
			
 
				+os.environ["FLAGS_allocator_strategy"] = 'auto_growth'
			
 
				+
			
 
				+import cv2
			
 
				+import numpy as np
			
 
				+import time
			
 
				+import sys
			
 
				+
			
 
				+import tools.infer.utility as utility
			
 
				+from ppocr.utils.logging import get_logger
			
 
				+from ppocr.utils.utility import get_image_file_list, check_and_read_gif
			
 
				+from ppocr.data import create_operators, transform
			
 
				+from ppocr.postprocess import build_post_process
			
 
				+import json
			
 
				+logger = get_logger()
			
 
				+
			
 
				+
			
 
				+class TextDetector(object):
			
 
    def __init__(self, args):
        """Build the pre/post-processing pipeline and predictor for text detection.

        Args:
            args: Option namespace. The attributes read depend on
                ``args.det_algorithm`` ("DB", "EAST", "SAST", "PSE" or "FCE").
                ``use_onnx`` and ``benchmark`` are always read, as is
                ``det_resize_long`` for the default resize step.

        Note:
            An unknown ``det_algorithm`` is logged and the process then exits
            via ``sys.exit(0)``.
        """
        self.args = args
        self.det_algorithm = args.det_algorithm
        self.use_onnx = args.use_onnx
        # Default preprocessing chain. The resize step is driven by
        # `resize_long`; the limit_side_len/limit_type options are disabled.
        pre_process_list = [{
            'DetResizeForTest': {
                # 'limit_side_len': args.det_limit_side_len,
                # 'limit_type': args.det_limit_type,
                'resize_long': args.det_resize_long
            }
        }, {
            'NormalizeImage': {
                'std': [0.229, 0.224, 0.225],
                'mean': [0.485, 0.456, 0.406],
                'scale': '1./255.',
                'order': 'hwc'
            }
        }, {
            'ToCHWImage': None
        }, {
            'KeepKeys': {
                'keep_keys': ['image', 'shape']
            }
        }]
        # Post-processing options are selected per detection algorithm.
        postprocess_params = {}
        if self.det_algorithm == "DB":
            postprocess_params['name'] = 'DBPostProcess'
            postprocess_params["thresh"] = args.det_db_thresh
            postprocess_params["box_thresh"] = args.det_db_box_thresh
            postprocess_params["max_candidates"] = 1000
            postprocess_params["unclip_ratio"] = args.det_db_unclip_ratio
            postprocess_params["use_dilation"] = args.use_dilation
            postprocess_params["score_mode"] = args.det_db_score_mode
        elif self.det_algorithm == "EAST":
            postprocess_params['name'] = 'EASTPostProcess'
            postprocess_params["score_thresh"] = args.det_east_score_thresh
            postprocess_params["cover_thresh"] = args.det_east_cover_thresh
            postprocess_params["nms_thresh"] = args.det_east_nms_thresh
        elif self.det_algorithm == "SAST":
            # SAST replaces the resize step and takes its size from det_limit_side_len.
            pre_process_list[0] = {
                'DetResizeForTest': {
                    'resize_long': args.det_limit_side_len
                }
            }
            postprocess_params['name'] = 'SASTPostProcess'
            postprocess_params["score_thresh"] = args.det_sast_score_thresh
            postprocess_params["nms_thresh"] = args.det_sast_nms_thresh
            self.det_sast_polygon = args.det_sast_polygon
            if self.det_sast_polygon:
                postprocess_params["sample_pts_num"] = 6
                postprocess_params["expand_scale"] = 1.2
                postprocess_params["shrink_ratio_of_width"] = 0.2
            else:
                postprocess_params["sample_pts_num"] = 2
                postprocess_params["expand_scale"] = 1.0
                postprocess_params["shrink_ratio_of_width"] = 0.3
        elif self.det_algorithm == "PSE":
            postprocess_params['name'] = 'PSEPostProcess'
            postprocess_params["thresh"] = args.det_pse_thresh
            postprocess_params["box_thresh"] = args.det_pse_box_thresh
            postprocess_params["min_area"] = args.det_pse_min_area
            postprocess_params["box_type"] = args.det_pse_box_type
            postprocess_params["scale"] = args.det_pse_scale
            self.det_pse_box_type = args.det_pse_box_type
        elif self.det_algorithm == "FCE":
            # FCE replaces the resize step with a fixed rescale size.
            pre_process_list[0] = {
                'DetResizeForTest': {
                    'rescale_img': [1080, 736]
                }
            }
            postprocess_params['name'] = 'FCEPostProcess'
            postprocess_params["scales"] = args.scales
            postprocess_params["alpha"] = args.alpha
            postprocess_params["beta"] = args.beta
            postprocess_params["fourier_degree"] = args.fourier_degree
            postprocess_params["box_type"] = args.det_fce_box_type
        else:
            logger.info("unknown det_algorithm:{}".format(self.det_algorithm))
            sys.exit(0)

        self.preprocess_op = create_operators(pre_process_list)
        self.postprocess_op = build_post_process(postprocess_params)
        self.predictor, self.input_tensor, self.output_tensors, self.config = utility.create_predictor(
            args, 'det', logger)

        if self.use_onnx:
            # With a fixed-size ONNX input, resize to exactly that shape.
            img_h, img_w = self.input_tensor.shape[2:]
            if img_h is not None and img_w is not None and img_h > 0 and img_w > 0:
                pre_process_list[0] = {
                    'DetResizeForTest': {
                        'image_shape': [img_h, img_w]
                    }
                }
        # Built a second time so that the ONNX override above takes effect.
        self.preprocess_op = create_operators(pre_process_list)

        if args.benchmark:
            # auto_log is imported only when benchmarking is requested.
            import auto_log
            pid = os.getpid()
            gpu_id = utility.get_infer_gpuid()
            self.autolog = auto_log.AutoLogger(
                model_name="det",
                model_precision=args.precision,
                batch_size=1,
                data_shape="dynamic",
                save_path=None,
                inference_config=self.config,
                pids=pid,
                process_name=None,
                gpu_ids=gpu_id if args.use_gpu else None,
                time_keys=[
                    'preprocess_time', 'inference_time', 'postprocess_time'
                ],
                warmup=2,
                logger=logger)
			
 
				+
			
 
    def order_points_clockwise(self, pts):
        """Order the corners of a quadrilateral clockwise from the top-left.

        The result is laid out as top-left, top-right, bottom-right,
        bottom-left in image coordinates (y grows downwards).

        Args:
            pts: 2-D array of (x, y) corner coordinates; expected to hold
                four rows.

        Returns:
            A new float32 array of shape (4, 2) with the ordered corners.
        """
        rect = np.zeros((4, 2), dtype="float32")
        # Top-left has the smallest x + y, bottom-right the largest.
        s = pts.sum(axis=1)
        top_left = np.argmin(s)
        bottom_right = np.argmax(s)
        rect[0] = pts[top_left]
        rect[2] = pts[bottom_right]
        # Remove the two corners that are already assigned before looking for
        # the other two; otherwise a rotated box (e.g. a diamond) can pick the
        # same point twice and produce a degenerate quadrilateral.
        remaining = np.delete(pts, (top_left, bottom_right), axis=0)
        # Top-right has the smallest y - x, bottom-left the largest.
        diff = np.diff(remaining, axis=1)
        rect[1] = remaining[np.argmin(diff)]
        rect[3] = remaining[np.argmax(diff)]
        return rect
			
 
				+
			
 
    def clip_det_res(self, points, img_height, img_width):
        """Clamp every point to the image bounds, in place.

        x is limited to [0, img_width - 1] and y to [0, img_height - 1];
        each clamped coordinate is truncated to an integer value before it
        is written back.

        Args:
            points: 2-D array whose rows start with (x, y); modified in place.
            img_height: image height in pixels.
            img_width: image width in pixels.

        Returns:
            The same ``points`` array that was passed in.
        """
        max_x = img_width - 1
        max_y = img_height - 1
        # Iterating a 2-D array yields row views, so the writes below land in
        # the caller's array.
        for row in points:
            row[0] = int(min(max(row[0], 0), max_x))
            row[1] = int(min(max(row[1], 0), max_y))
        return points
			
 
				+
			
 
				+    def filter_tag_det_res(self, dt_boxes, image_shape):
			
 
				+        img_height, img_width = image_shape[0:2]
			
 
				+        dt_boxes_new = []
			
 
				+        for box in dt_boxes:
			
 
				+            box = self.order_points_clockwise(box)
			
 
				+            box = self.clip_det_res(box, img_height, img_width)
			
 
				+            rect_width = int(np.linalg.norm(box[0] - box[1]))
			
 
				+            rect_height = int(np.linalg.norm(box[0] - box[3]))
			
 
				+            if rect_width <= 3 or rect_height <= 3:
			
 
				+                continue
			
 
				+            dt_boxes_new.append(box)
			
 
				+        dt_boxes = np.array(dt_boxes_new)
			
 
				+        return dt_boxes
			
 
				+
			
 
				+    def filter_tag_det_res_only_clip(self, dt_boxes, image_shape):
			
 
				+        img_height, img_width = image_shape[0:2]
			
 
				+        dt_boxes_new = []
			
 
				+        for box in dt_boxes:
			
 
				+            box = self.clip_det_res(box, img_height, img_width)
			
 
				+            dt_boxes_new.append(box)
			
 
				+        dt_boxes = np.array(dt_boxes_new)
			
 
				+        return dt_boxes
			
 
				+
			
 
    def __call__(self, img):
        """Run text detection on one image.

        The image is preprocessed, pushed through the predictor (ONNX
        session or Paddle predictor, depending on ``self.use_onnx``),
        post-processed into boxes, and the boxes are clipped/filtered against
        the original image shape.

        Args:
            img: input image array; it is copied up front so the original
                shape stays available for clipping.

        Returns:
            ``(dt_boxes, elapse)`` where ``elapse`` is the wall-clock time in
            seconds spent in this call, or ``(None, 0)`` when preprocessing
            yields no image.

        Raises:
            NotImplementedError: if ``self.det_algorithm`` is not one of the
                algorithms handled below.
        """
        ori_im = img.copy()
        data = {'image': img}

        st = time.time()

        if self.args.benchmark:
            self.autolog.times.start()

        data = transform(data, self.preprocess_op)
        # Guard before unpacking: if the preprocessing pipeline gives back
        # None instead of an (image, shape) pair, unpacking would raise a
        # TypeError and the "no image" return below would never be reached.
        if data is None:
            return None, 0
        img, shape_list = data
        if img is None:
            return None, 0
        # Add the leading batch dimension expected by the predictor.
        img = np.expand_dims(img, axis=0)
        shape_list = np.expand_dims(shape_list, axis=0)
        img = img.copy()

        if self.args.benchmark:
            self.autolog.times.stamp()
        if self.use_onnx:
            input_dict = {self.input_tensor.name: img}
            outputs = self.predictor.run(self.output_tensors, input_dict)
        else:
            self.input_tensor.copy_from_cpu(img)
            self.predictor.run()
            outputs = [
                output_tensor.copy_to_cpu()
                for output_tensor in self.output_tensors
            ]
            if self.args.benchmark:
                self.autolog.times.stamp()

        # Map the raw outputs onto the keys each post-processor expects.
        preds = {}
        if self.det_algorithm == "EAST":
            preds['f_geo'] = outputs[0]
            preds['f_score'] = outputs[1]
        elif self.det_algorithm == 'SAST':
            preds['f_border'] = outputs[0]
            preds['f_score'] = outputs[1]
            preds['f_tco'] = outputs[2]
            preds['f_tvo'] = outputs[3]
        elif self.det_algorithm in ['DB', 'PSE']:
            preds['maps'] = outputs[0]
        elif self.det_algorithm == 'FCE':
            for i, output in enumerate(outputs):
                preds['level_{}'.format(i)] = output
        else:
            raise NotImplementedError

        #self.predictor.try_shrink_memory()
        post_result = self.postprocess_op(preds, shape_list)
        dt_boxes = post_result[0]['points']
        # Polygon outputs are only clipped; quadrilateral outputs are also
        # reordered and filtered by size.
        if (self.det_algorithm == "SAST" and self.det_sast_polygon) or (
                self.det_algorithm in ["PSE", "FCE"] and
                self.postprocess_op.box_type == 'poly'):
            dt_boxes = self.filter_tag_det_res_only_clip(dt_boxes, ori_im.shape)
        else:
            dt_boxes = self.filter_tag_det_res(dt_boxes, ori_im.shape)

        if self.args.benchmark:
            self.autolog.times.end(stamp=True)
        et = time.time()
        return dt_boxes, et - st
			
 
				+
			
 
				+
			
 
				+if __name__ == "__main__":
			
 
				+    args = utility.parse_args()
			
 
				+    image_file_list = get_image_file_list(args.image_dir)
			
 
				+    text_detector = TextDetector(args)
			
 
				+    count = 0
			
 
				+    total_time = 0
			
 
				+    draw_img_save = "./inference_results"
			
 
				+
			
 
				+    if args.warmup:
			
 
				+        img = np.random.uniform(0, 255, [640, 640, 3]).astype(np.uint8)
			
 
				+        for i in range(2):
			
 
				+            res = text_detector(img)
			
 
				+
			
 
				+    if not os.path.exists(draw_img_save):
			
 
				+        os.makedirs(draw_img_save)
			
 
				+    save_results = []
			
 
				+    for image_file in image_file_list:
			
 
				+        img, flag = check_and_read_gif(image_file)
			
 
				+        if not flag:
			
 
				+            img = cv2.imread(image_file)
			
 
				+        if img is None:
			
 
				+            logger.info("error in loading image:{}".format(image_file))
			
 
				+            continue
			
 
				+        st = time.time()
			
 
				+        dt_boxes, _ = text_detector(img)
			
 
				+        elapse = time.time() - st
			
 
				+        if count > 0:
			
 
				+            total_time += elapse
			
 
				+        count += 1
			
 
				+        save_pred = os.path.basename(image_file) + "\t" + str(
			
 
				+            json.dumps([x.tolist() for x in dt_boxes])) + "\n"
			
 
				+        save_results.append(save_pred)
			
 
				+        logger.info(save_pred)
			
 
				+        logger.info("The predict time of {}: {}".format(image_file, elapse))
			
 
				+        src_im = utility.draw_text_det_res(dt_boxes, image_file)
			
 
				+        img_name_pure = os.path.split(image_file)[-1]
			
 
				+        img_path = os.path.join(draw_img_save,
			
 
				+                                "det_res_{}".format(img_name_pure))
			
 
				+        cv2.imwrite(img_path, src_im)
			
 
				+        logger.info("The visualized image saved in {}".format(img_path))
			
 
				+
			
 
				+    with open(os.path.join(draw_img_save, "det_results.txt"), 'w') as f:
			
 
				+        f.writelines(save_results)
			
 
				+        f.close()
			
 
				+    if args.benchmark:
			
 
				+        text_detector.autolog.report()
			
--- a/run.py
+++ b/run.py
@@ -7,6 +7,5 @@ if __name__ == '__main__':
 
				     parser.add_argument('--port', default=8080)
			
 
				     opt = parser.parse_args()
			
 
				 
			
 
				-
			
 
				     app_str = 'server:app'  # make the app string equal to whatever the name of this file is
			
 
				     uvicorn.run(app_str, host=opt.host, port=int(opt.port), reload=True, log_level='debug', workers=1)
			
--- a/server.py
+++ b/server.py
@@ -34,21 +34,39 @@ print(f'use gpu: {use_gpu}')
 
				 #                 rec_model_dir="./bank_rec_infer/",
			
 
				 #                 det_model_dir="./bank_det_infer/",
			
 
				 #                 cls_model_dir="./bank_cls_infer/",
			
 
				-#                 rec_algorithm='CRNN',
			
 
				-#                 # rec_image_shape='3, 32, 320',
			
 
				-#                 ocr_version='PP-OCRv2',
			
 
				-#                 rec_char_dict_path="./ppocr_keys_v1.txt",
			
 
				+#                 # rec_algorithm='SVTR_LCNet',
			
 
				+#                 rec_image_shape='3, 48, 320',
			
 
				+#                 # ocr_version='PP-OCRv2',
			
 
				+#                 rec_char_dict_path="./ppocr_keys_bank.txt",
			
 
				 #                 use_gpu=use_gpu,
			
 
				 #                 save_crop_res=True,
			
 
				 #                 warmup=True)
			
 
				 
			
 
				+
			
 
				 ocr = PaddleOCR(use_angle_cls=True,
			
 
				                 use_gpu=use_gpu,
			
 
				                 det_db_unclip_ratio=2.5,
			
 
				-                det_db_thresh=0.1,
			
 
				-                det_db_box_thresh=0.4,
			
 
				-                # save_crop_res=True,
			
 
				-                warmup=True)
			
 
				+                det_db_thresh=0.3,
			
 
				+                det_db_box_thresh=0.6,
			
 
				+                det_model_dir="./bank_det_infer/",
			
 
				+                save_crop_res=True,
			
 
				+                rec_model_dir="./bank_rec_infer/",
			
 
				+                rec_char_dict_path="./ppocr_keys_bank.txt",
			
 
				+                use_space_char=False,
			
 
				+                warmup=True
			
 
				+                )
			
 
				+
			
 
				+
			
 
				+origin_ocr = PaddleOCR(use_angle_cls=True,
			
 
				+                       use_gpu=use_gpu,
			
 
				+                       det_db_unclip_ratio=2.5,
			
 
				+                       det_db_thresh=0.3,
			
 
				+                       det_db_box_thresh=0.6,
			
 
				+                       rec_model_dir="./bank_rec_infer/",
			
 
				+                       rec_char_dict_path="./ppocr_keys_bank.txt",
			
 
				+                       use_space_char=False,
			
 
				+                       warmup=True
			
 
				+                       )
			
 
				 
			
 
				 
			
 
				 # ocr = PaddleOCR(use_angle_cls=True,
			
@@ -64,7 +82,7 @@ ocr = PaddleOCR(use_angle_cls=True,
 
				 #                 warmup=True)
			
 
				 
			
 
				 
			
 
				-ad = AngleDetector(ocr)
			
 
				+ad = AngleDetector(origin_ocr)
			
 
				 m = BankOcr(ocr, ad)
			
 
				 
			
 
				 
			
--- a/simfang.ttf
+++ b/simfang.ttf
--- a/testing/error_101_test.py
+++ b/testing/error_101_test.py
--- a/testing/utils.py
+++ b/testing/utils.py
@@ -3,13 +3,14 @@ import base64
 
				 import requests
			
 
				 
			
 
				 
			
 
				-url = 'http://192.168.13.54:18081'
			
 
				+url = 'http://192.168.199.249:2991'
			
 
				 
			
 
				 
			
 
				 # url = 'http://aihub-test.digitalyili.com/aiSquare/openApi/reasoning-services/rlocrxm'
			
 
				 # header = {
			
 
				 #     'Authorization': 'Bearer 9679c2b3-b90b-4029-a3c7-f347b4d242f7'
			
 
				 # }
			
 
				+
			
 
				 def send_request(image_path):
			
 
				     with open(image_path, 'rb') as f:
			
 
				         img_str: str = base64.encodebytes(f.read()).decode('utf-8')
			
--- a/utility.py
+++ b/utility.py
@@ -0,0 +1,646 @@
 
				+# Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.
			
 
				+#
			
 
				+# Licensed under the Apache License, Version 2.0 (the "License");
			
 
				+# you may not use this file except in compliance with the License.
			
 
				+# You may obtain a copy of the License at
			
 
				+#
			
 
				+#     http://www.apache.org/licenses/LICENSE-2.0
			
 
				+#
			
 
				+# Unless required by applicable law or agreed to in writing, software
			
 
				+# distributed under the License is distributed on an "AS IS" BASIS,
			
 
				+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
			
 
				+# See the License for the specific language governing permissions and
			
 
				+# limitations under the License.
			
 
				+
			
 
				+import argparse
			
 
				+import os
			
 
				+import sys
			
 
				+import platform
			
 
				+import cv2
			
 
				+import numpy as np
			
 
				+import paddle
			
 
				+from PIL import Image, ImageDraw, ImageFont
			
 
				+import math
			
 
				+from paddle import inference
			
 
				+import time
			
 
				+from ppocr.utils.logging import get_logger
			
 
				+
			
 
				+
			
 
				+def str2bool(v):
			
 
				+    return v.lower() in ("true", "t", "1")
			
 
				+
			
 
				+
			
 
				+def init_args():
			
 
				+    parser = argparse.ArgumentParser()
			
 
				+    # params for prediction engine
			
 
				+    parser.add_argument("--use_gpu", type=str2bool, default=True)
			
 
				+    parser.add_argument("--ir_optim", type=str2bool, default=True)
			
 
				+    parser.add_argument("--use_tensorrt", type=str2bool, default=False)
			
 
				+    parser.add_argument("--min_subgraph_size", type=int, default=15)
			
 
				+    parser.add_argument("--precision", type=str, default="fp32")
			
 
				+    parser.add_argument("--gpu_mem", type=int, default=500)
			
 
				+
			
 
				+    # params for text detector
			
 
				+    parser.add_argument("--image_dir", type=str)
			
 
				+    parser.add_argument("--det_algorithm", type=str, default='DB')
			
 
				+    parser.add_argument("--det_model_dir", type=str)
			
 
				+    parser.add_argument("--det_resize_long", type=float, default=960)
			
 
				+    parser.add_argument("--det_limit_side_len", type=float, default=960)
			
 
				+    parser.add_argument("--det_limit_type", type=str, default='max')
			
 
				+
			
 
				+    # DB parmas
			
 
				+    parser.add_argument("--det_db_thresh", type=float, default=0.3)
			
 
				+    parser.add_argument("--det_db_box_thresh", type=float, default=0.6)
			
 
				+    parser.add_argument("--det_db_unclip_ratio", type=float, default=1.5)
			
 
				+    parser.add_argument("--max_batch_size", type=int, default=10)
			
 
				+    parser.add_argument("--use_dilation", type=str2bool, default=False)
			
 
				+    parser.add_argument("--det_db_score_mode", type=str, default="fast")
			
 
				+    # EAST parmas
			
 
				+    parser.add_argument("--det_east_score_thresh", type=float, default=0.8)
			
 
				+    parser.add_argument("--det_east_cover_thresh", type=float, default=0.1)
			
 
				+    parser.add_argument("--det_east_nms_thresh", type=float, default=0.2)
			
 
				+
			
 
				+    # SAST parmas
			
 
				+    parser.add_argument("--det_sast_score_thresh", type=float, default=0.5)
			
 
				+    parser.add_argument("--det_sast_nms_thresh", type=float, default=0.2)
			
 
				+    parser.add_argument("--det_sast_polygon", type=str2bool, default=False)
			
 
				+
			
 
				+    # PSE parmas
			
 
				+    parser.add_argument("--det_pse_thresh", type=float, default=0)
			
 
				+    parser.add_argument("--det_pse_box_thresh", type=float, default=0.85)
			
 
				+    parser.add_argument("--det_pse_min_area", type=float, default=16)
			
 
				+    parser.add_argument("--det_pse_box_type", type=str, default='quad')
			
 
				+    parser.add_argument("--det_pse_scale", type=int, default=1)
			
 
				+
			
 
				+    # FCE parmas
			
 
				+    parser.add_argument("--scales", type=list, default=[8, 16, 32])
			
 
				+    parser.add_argument("--alpha", type=float, default=1.0)
			
 
				+    parser.add_argument("--beta", type=float, default=1.0)
			
 
				+    parser.add_argument("--fourier_degree", type=int, default=5)
			
 
				+    parser.add_argument("--det_fce_box_type", type=str, default='poly')
			
 
				+
			
 
				+    # params for text recognizer
			
 
				+    parser.add_argument("--rec_algorithm", type=str, default='SVTR_LCNet')
			
 
				+    parser.add_argument("--rec_model_dir", type=str)
			
 
				+    parser.add_argument("--rec_image_shape", type=str, default="3, 48, 320")
			
 
				+    parser.add_argument("--rec_batch_num", type=int, default=6)
			
 
				+    parser.add_argument("--max_text_length", type=int, default=25)
			
 
				+    parser.add_argument(
			
 
				+        "--rec_char_dict_path",
			
 
				+        type=str,
			
 
				+        default="./ppocr/utils/ppocr_keys_v1.txt")
			
 
				+    parser.add_argument("--use_space_char", type=str2bool, default=True)
			
 
				+    parser.add_argument(
			
 
				+        "--vis_font_path", type=str, default="./doc/fonts/simfang.ttf")
			
 
				+    parser.add_argument("--drop_score", type=float, default=0.5)
			
 
				+
			
 
				+    # params for e2e
			
 
				+    parser.add_argument("--e2e_algorithm", type=str, default='PGNet')
			
 
				+    parser.add_argument("--e2e_model_dir", type=str)
			
 
				+    parser.add_argument("--e2e_limit_side_len", type=float, default=768)
			
 
				+    parser.add_argument("--e2e_limit_type", type=str, default='max')
			
 
				+
			
 
				+    # PGNet parmas
			
 
				+    parser.add_argument("--e2e_pgnet_score_thresh", type=float, default=0.5)
			
 
				+    parser.add_argument(
			
 
				+        "--e2e_char_dict_path", type=str, default="./ppocr/utils/ic15_dict.txt")
			
 
				+    parser.add_argument("--e2e_pgnet_valid_set", type=str, default='totaltext')
			
 
				+    parser.add_argument("--e2e_pgnet_mode", type=str, default='fast')
			
 
				+
			
 
				+    # params for text classifier
			
 
				+    parser.add_argument("--use_angle_cls", type=str2bool, default=False)
			
 
				+    parser.add_argument("--cls_model_dir", type=str)
			
 
				+    parser.add_argument("--cls_image_shape", type=str, default="3, 48, 192")
			
 
				+    parser.add_argument("--label_list", type=list, default=['0', '180'])
			
 
				+    parser.add_argument("--cls_batch_num", type=int, default=6)
			
 
				+    parser.add_argument("--cls_thresh", type=float, default=0.9)
			
 
				+
			
 
				+    parser.add_argument("--enable_mkldnn", type=str2bool, default=False)
			
 
				+    parser.add_argument("--cpu_threads", type=int, default=10)
			
 
				+    parser.add_argument("--use_pdserving", type=str2bool, default=False)
			
 
				+    parser.add_argument("--warmup", type=str2bool, default=False)
			
 
				+
			
 
				+    #
			
 
				+    parser.add_argument(
			
 
				+        "--draw_img_save_dir", type=str, default="./inference_results")
			
 
				+    parser.add_argument("--save_crop_res", type=str2bool, default=False)
			
 
				+    parser.add_argument("--crop_res_save_dir", type=str, default="./output")
			
 
				+
			
 
				+    # multi-process
			
 
				+    parser.add_argument("--use_mp", type=str2bool, default=False)
			
 
				+    parser.add_argument("--total_process_num", type=int, default=1)
			
 
				+    parser.add_argument("--process_id", type=int, default=0)
			
 
				+
			
 
				+    parser.add_argument("--benchmark", type=str2bool, default=False)
			
 
				+    parser.add_argument("--save_log_path", type=str, default="./log_output/")
			
 
				+
			
 
				+    parser.add_argument("--show_log", type=str2bool, default=True)
			
 
				+    parser.add_argument("--use_onnx", type=str2bool, default=False)
			
 
				+    return parser
			
 
				+
			
 
				+
			
 
				+def parse_args():
			
 
				+    parser = init_args()
			
 
				+    return parser.parse_args()
			
 
				+
			
 
				+
			
 
				+def create_predictor(args, mode, logger):
			
 
				+    if mode == "det":
			
 
				+        model_dir = args.det_model_dir
			
 
				+    elif mode == 'cls':
			
 
				+        model_dir = args.cls_model_dir
			
 
				+    elif mode == 'rec':
			
 
				+        model_dir = args.rec_model_dir
			
 
				+    elif mode == 'table':
			
 
				+        model_dir = args.table_model_dir
			
 
				+    else:
			
 
				+        model_dir = args.e2e_model_dir
			
 
				+
			
 
				+    if model_dir is None:
			
 
				+        logger.info("not find {} model file path {}".format(mode, model_dir))
			
 
				+        sys.exit(0)
			
 
				+    if args.use_onnx:
			
 
				+        import onnxruntime as ort
			
 
				+        model_file_path = model_dir
			
 
				+        if not os.path.exists(model_file_path):
			
 
				+            raise ValueError("not find model file path {}".format(
			
 
				+                model_file_path))
			
 
				+        sess = ort.InferenceSession(model_file_path)
			
 
				+        return sess, sess.get_inputs()[0], None, None
			
 
				+
			
 
				+    else:
			
 
				+        model_file_path = model_dir + "/inference.pdmodel"
			
 
				+        params_file_path = model_dir + "/inference.pdiparams"
			
 
				+        if not os.path.exists(model_file_path):
			
 
				+            raise ValueError("not find model file path {}".format(
			
 
				+                model_file_path))
			
 
				+        if not os.path.exists(params_file_path):
			
 
				+            raise ValueError("not find params file path {}".format(
			
 
				+                params_file_path))
			
 
				+
			
 
				+        config = inference.Config(model_file_path, params_file_path)
			
 
				+
			
 
				+        if hasattr(args, 'precision'):
			
 
				+            if args.precision == "fp16" and args.use_tensorrt:
			
 
				+                precision = inference.PrecisionType.Half
			
 
				+            elif args.precision == "int8":
			
 
				+                precision = inference.PrecisionType.Int8
			
 
				+            else:
			
 
				+                precision = inference.PrecisionType.Float32
			
 
				+        else:
			
 
				+            precision = inference.PrecisionType.Float32
			
 
				+
			
 
				+        if args.use_gpu:
			
 
				+            gpu_id = get_infer_gpuid()
			
 
				+            if gpu_id is None:
			
 
				+                logger.warning(
			
 
				+                    "GPU is not found in current device by nvidia-smi. Please check your device or ignore it if run on jetson."
			
 
				+                )
			
 
				+            config.enable_use_gpu(args.gpu_mem, 0)
			
 
				+            if args.use_tensorrt:
			
 
				+                config.enable_tensorrt_engine(
			
 
				+                    workspace_size=1 << 30,
			
 
				+                    precision_mode=precision,
			
 
				+                    max_batch_size=args.max_batch_size,
			
 
				+                    min_subgraph_size=args.min_subgraph_size)
			
 
				+                # skip the minmum trt subgraph
			
 
				+            use_dynamic_shape = True
			
 
				+            if mode == "det":
			
 
				+                min_input_shape = {
			
 
				+                    "x": [1, 3, 50, 50],
			
 
				+                    "conv2d_92.tmp_0": [1, 120, 20, 20],
			
 
				+                    "conv2d_91.tmp_0": [1, 24, 10, 10],
			
 
				+                    "conv2d_59.tmp_0": [1, 96, 20, 20],
			
 
				+                    "nearest_interp_v2_1.tmp_0": [1, 256, 10, 10],
			
 
				+                    "nearest_interp_v2_2.tmp_0": [1, 256, 20, 20],
			
 
				+                    "conv2d_124.tmp_0": [1, 256, 20, 20],
			
 
				+                    "nearest_interp_v2_3.tmp_0": [1, 64, 20, 20],
			
 
				+                    "nearest_interp_v2_4.tmp_0": [1, 64, 20, 20],
			
 
				+                    "nearest_interp_v2_5.tmp_0": [1, 64, 20, 20],
			
 
				+                    "elementwise_add_7": [1, 56, 2, 2],
			
 
				+                    "nearest_interp_v2_0.tmp_0": [1, 256, 2, 2]
			
 
				+                }
			
 
				+                max_input_shape = {
			
 
				+                    "x": [1, 3, 1536, 1536],
			
 
				+                    "conv2d_92.tmp_0": [1, 120, 400, 400],
			
 
				+                    "conv2d_91.tmp_0": [1, 24, 200, 200],
			
 
				+                    "conv2d_59.tmp_0": [1, 96, 400, 400],
			
 
				+                    "nearest_interp_v2_1.tmp_0": [1, 256, 200, 200],
			
 
				+                    "conv2d_124.tmp_0": [1, 256, 400, 400],
			
 
				+                    "nearest_interp_v2_2.tmp_0": [1, 256, 400, 400],
			
 
				+                    "nearest_interp_v2_3.tmp_0": [1, 64, 400, 400],
			
 
				+                    "nearest_interp_v2_4.tmp_0": [1, 64, 400, 400],
			
 
				+                    "nearest_interp_v2_5.tmp_0": [1, 64, 400, 400],
			
 
				+                    "elementwise_add_7": [1, 56, 400, 400],
			
 
				+                    "nearest_interp_v2_0.tmp_0": [1, 256, 400, 400]
			
 
				+                }
			
 
				+                opt_input_shape = {
			
 
				+                    "x": [1, 3, 640, 640],
			
 
				+                    "conv2d_92.tmp_0": [1, 120, 160, 160],
			
 
				+                    "conv2d_91.tmp_0": [1, 24, 80, 80],
			
 
				+                    "conv2d_59.tmp_0": [1, 96, 160, 160],
			
 
				+                    "nearest_interp_v2_1.tmp_0": [1, 256, 80, 80],
			
 
				+                    "nearest_interp_v2_2.tmp_0": [1, 256, 160, 160],
			
 
				+                    "conv2d_124.tmp_0": [1, 256, 160, 160],
			
 
				+                    "nearest_interp_v2_3.tmp_0": [1, 64, 160, 160],
			
 
				+                    "nearest_interp_v2_4.tmp_0": [1, 64, 160, 160],
			
 
				+                    "nearest_interp_v2_5.tmp_0": [1, 64, 160, 160],
			
 
				+                    "elementwise_add_7": [1, 56, 40, 40],
			
 
				+                    "nearest_interp_v2_0.tmp_0": [1, 256, 40, 40]
			
 
				+                }
			
 
				+                min_pact_shape = {
			
 
				+                    "nearest_interp_v2_26.tmp_0": [1, 256, 20, 20],
			
 
				+                    "nearest_interp_v2_27.tmp_0": [1, 64, 20, 20],
			
 
				+                    "nearest_interp_v2_28.tmp_0": [1, 64, 20, 20],
			
 
				+                    "nearest_interp_v2_29.tmp_0": [1, 64, 20, 20]
			
 
				+                }
			
 
				+                max_pact_shape = {
			
 
				+                    "nearest_interp_v2_26.tmp_0": [1, 256, 400, 400],
			
 
				+                    "nearest_interp_v2_27.tmp_0": [1, 64, 400, 400],
			
 
				+                    "nearest_interp_v2_28.tmp_0": [1, 64, 400, 400],
			
 
				+                    "nearest_interp_v2_29.tmp_0": [1, 64, 400, 400]
			
 
				+                }
			
 
				+                opt_pact_shape = {
			
 
				+                    "nearest_interp_v2_26.tmp_0": [1, 256, 160, 160],
			
 
				+                    "nearest_interp_v2_27.tmp_0": [1, 64, 160, 160],
			
 
				+                    "nearest_interp_v2_28.tmp_0": [1, 64, 160, 160],
			
 
				+                    "nearest_interp_v2_29.tmp_0": [1, 64, 160, 160]
			
 
				+                }
			
 
				+                min_input_shape.update(min_pact_shape)
			
 
				+                max_input_shape.update(max_pact_shape)
			
 
				+                opt_input_shape.update(opt_pact_shape)
			
 
				+            elif mode == "rec":
			
 
				+                if args.rec_algorithm not in ["CRNN", "SVTR_LCNet"]:
			
 
				+                    use_dynamic_shape = False
			
 
				+                imgH = int(args.rec_image_shape.split(',')[-2])
			
 
				+                min_input_shape = {"x": [1, 3, imgH, 10]}
			
 
				+                max_input_shape = {"x": [args.rec_batch_num, 3, imgH, 2304]}
			
 
				+                opt_input_shape = {"x": [args.rec_batch_num, 3, imgH, 320]}
			
 
				+            elif mode == "cls":
			
 
				+                min_input_shape = {"x": [1, 3, 48, 10]}
			
 
				+                max_input_shape = {"x": [args.rec_batch_num, 3, 48, 1024]}
			
 
				+                opt_input_shape = {"x": [args.rec_batch_num, 3, 48, 320]}
			
 
				+            else:
			
 
				+                use_dynamic_shape = False
			
 
				+            if use_dynamic_shape:
			
 
				+                config.set_trt_dynamic_shape_info(
			
 
				+                    min_input_shape, max_input_shape, opt_input_shape)
			
 
				+
			
 
				+        else:
			
 
				+            config.disable_gpu()
			
 
				+            if hasattr(args, "cpu_threads"):
			
 
				+                config.set_cpu_math_library_num_threads(args.cpu_threads)
			
 
				+            else:
			
 
				+                # default cpu threads as 10
			
 
				+                config.set_cpu_math_library_num_threads(10)
			
 
				+            if args.enable_mkldnn:
			
 
				+                # cache 10 different shapes for mkldnn to avoid memory leak
			
 
				+                config.set_mkldnn_cache_capacity(10)
			
 
				+                config.enable_mkldnn()
			
 
				+                if args.precision == "fp16":
			
 
				+                    config.enable_mkldnn_bfloat16()
			
 
				+        # enable memory optim
			
 
				+        config.enable_memory_optim()
			
 
				+        config.disable_glog_info()
			
 
				+        config.delete_pass("conv_transpose_eltwiseadd_bn_fuse_pass")
			
 
				+        config.delete_pass("matmul_transpose_reshape_fuse_pass")
			
 
				+        if mode == 'table':
			
 
				+            config.delete_pass("fc_fuse_pass")  # not supported for table
			
 
				+        config.switch_use_feed_fetch_ops(False)
			
 
				+        config.switch_ir_optim(True)
			
 
				+
			
 
				+        # create predictor
			
 
				+        predictor = inference.create_predictor(config)
			
 
				+        input_names = predictor.get_input_names()
			
 
				+        for name in input_names:
			
 
				+            input_tensor = predictor.get_input_handle(name)
			
 
				+        output_tensors = get_output_tensors(args, mode, predictor)
			
 
				+        return predictor, input_tensor, output_tensors, config
			
 
				+
			
 
				+
			
 
				+def get_output_tensors(args, mode, predictor):
			
 
				+    output_names = predictor.get_output_names()
			
 
				+    output_tensors = []
			
 
				+    if mode == "rec" and args.rec_algorithm in ["CRNN", "SVTR_LCNet"]:
			
 
				+        output_name = 'softmax_0.tmp_0'
			
 
				+        if output_name in output_names:
			
 
				+            return [predictor.get_output_handle(output_name)]
			
 
				+        else:
			
 
				+            for output_name in output_names:
			
 
				+                output_tensor = predictor.get_output_handle(output_name)
			
 
				+                output_tensors.append(output_tensor)
			
 
				+    else:
			
 
				+        for output_name in output_names:
			
 
				+            output_tensor = predictor.get_output_handle(output_name)
			
 
				+            output_tensors.append(output_tensor)
			
 
				+    return output_tensors
			
 
				+
			
 
				+
			
 
				+def get_infer_gpuid():
			
 
				+    sysstr = platform.system()
			
 
				+    if sysstr == "Windows":
			
 
				+        return 0
			
 
				+
			
 
				+    if not paddle.fluid.core.is_compiled_with_rocm():
			
 
				+        cmd = "env | grep CUDA_VISIBLE_DEVICES"
			
 
				+    else:
			
 
				+        cmd = "env | grep HIP_VISIBLE_DEVICES"
			
 
				+    env_cuda = os.popen(cmd).readlines()
			
 
				+    if len(env_cuda) == 0:
			
 
				+        return 0
			
 
				+    else:
			
 
				+        gpu_id = env_cuda[0].strip().split("=")[1]
			
 
				+        return int(gpu_id[0])
			
 
				+
			
 
				+
			
 
				+def draw_e2e_res(dt_boxes, strs, img_path):
			
 
				+    src_im = cv2.imread(img_path)
			
 
				+    for box, str in zip(dt_boxes, strs):
			
 
				+        box = box.astype(np.int32).reshape((-1, 1, 2))
			
 
				+        cv2.polylines(src_im, [box], True, color=(255, 255, 0), thickness=2)
			
 
				+        cv2.putText(
			
 
				+            src_im,
			
 
				+            str,
			
 
				+            org=(int(box[0, 0, 0]), int(box[0, 0, 1])),
			
 
				+            fontFace=cv2.FONT_HERSHEY_COMPLEX,
			
 
				+            fontScale=0.7,
			
 
				+            color=(0, 255, 0),
			
 
				+            thickness=1)
			
 
				+    return src_im
			
 
				+
			
 
				+
			
 
				+def draw_text_det_res(dt_boxes, img_path):
			
 
				+    src_im = cv2.imread(img_path)
			
 
				+    for box in dt_boxes:
			
 
				+        box = np.array(box).astype(np.int32).reshape(-1, 2)
			
 
				+        cv2.polylines(src_im, [box], True, color=(255, 255, 0), thickness=2)
			
 
				+    return src_im
			
 
				+
			
 
				+
			
 
				+def resize_img(img, input_size=600):
			
 
				+    """
			
 
				+    resize img and limit the longest side of the image to input_size
			
 
				+    """
			
 
				+    img = np.array(img)
			
 
				+    im_shape = img.shape
			
 
				+    im_size_max = np.max(im_shape[0:2])
			
 
				+    im_scale = float(input_size) / float(im_size_max)
			
 
				+    img = cv2.resize(img, None, None, fx=im_scale, fy=im_scale)
			
 
				+    return img
			
 
				+
			
 
				+
			
 
				+def draw_ocr(image,
			
 
				+             boxes,
			
 
				+             txts=None,
			
 
				+             scores=None,
			
 
				+             drop_score=0.5,
			
 
				+             font_path="./doc/fonts/simfang.ttf"):
			
 
				+    """
			
 
				+    Visualize the results of OCR detection and recognition
			
 
				+    args:
			
 
				+        image(Image|array): RGB image
			
 
				+        boxes(list): boxes with shape(N, 4, 2)
			
 
				+        txts(list): the texts
			
 
				+        scores(list): txxs corresponding scores
			
 
				+        drop_score(float): only scores greater than drop_threshold will be visualized
			
 
				+        font_path: the path of font which is used to draw text
			
 
				+    return(array):
			
 
				+        the visualized img
			
 
				+    """
			
 
				+    if scores is None:
			
 
				+        scores = [1] * len(boxes)
			
 
				+    box_num = len(boxes)
			
 
				+    for i in range(box_num):
			
 
				+        if scores is not None and (scores[i] < drop_score or
			
 
				+                                   math.isnan(scores[i])):
			
 
				+            continue
			
 
				+        box = np.reshape(np.array(boxes[i]), [-1, 1, 2]).astype(np.int64)
			
 
				+        image = cv2.polylines(np.array(image), [box], True, (255, 0, 0), 2)
			
 
				+    if txts is not None:
			
 
				+        img = np.array(resize_img(image, input_size=600))
			
 
				+        txt_img = text_visual(
			
 
				+            txts,
			
 
				+            scores,
			
 
				+            img_h=img.shape[0],
			
 
				+            img_w=600,
			
 
				+            threshold=drop_score,
			
 
				+            font_path=font_path)
			
 
				+        img = np.concatenate([np.array(img), np.array(txt_img)], axis=1)
			
 
				+        return img
			
 
				+    return image
			
 
				+
			
 
				+
			
 
				+def draw_ocr_box_txt(image,
			
 
				+                     boxes,
			
 
				+                     txts,
			
 
				+                     scores=None,
			
 
				+                     drop_score=0.5,
			
 
				+                     font_path="./doc/simfang.ttf"):
			
 
				+    h, w = image.height, image.width
			
 
				+    img_left = image.copy()
			
 
				+    img_right = Image.new('RGB', (w, h), (255, 255, 255))
			
 
				+
			
 
				+    import random
			
 
				+
			
 
				+    random.seed(0)
			
 
				+    draw_left = ImageDraw.Draw(img_left)
			
 
				+    draw_right = ImageDraw.Draw(img_right)
			
 
				+    for idx, (box, txt) in enumerate(zip(boxes, txts)):
			
 
				+        if scores is not None and scores[idx] < drop_score:
			
 
				+            continue
			
 
				+        color = (random.randint(0, 255), random.randint(0, 255),
			
 
				+                 random.randint(0, 255))
			
 
				+        draw_left.polygon(box, fill=color)
			
 
				+        draw_right.polygon(
			
 
				+            [
			
 
				+                box[0][0], box[0][1], box[1][0], box[1][1], box[2][0],
			
 
				+                box[2][1], box[3][0], box[3][1]
			
 
				+            ],
			
 
				+            outline=color)
			
 
				+        box_height = math.sqrt((box[0][0] - box[3][0])**2 + (box[0][1] - box[3][
			
 
				+            1])**2)
			
 
				+        box_width = math.sqrt((box[0][0] - box[1][0])**2 + (box[0][1] - box[1][
			
 
				+            1])**2)
			
 
				+        if box_height > 2 * box_width:
			
 
				+            font_size = max(int(box_width * 0.9), 10)
			
 
				+            font = ImageFont.truetype(font_path, font_size, encoding="utf-8")
			
 
				+            cur_y = box[0][1]
			
 
				+            for c in txt:
			
 
				+                char_size = font.getsize(c)
			
 
				+                draw_right.text(
			
 
				+                    (box[0][0] + 3, cur_y), c, fill=(0, 0, 0), font=font)
			
 
				+                cur_y += char_size[1]
			
 
				+        else:
			
 
				+            font_size = max(int(box_height * 0.8), 10)
			
 
				+            font = ImageFont.truetype(font_path, font_size, encoding="utf-8")
			
 
				+            draw_right.text(
			
 
				+                [box[0][0], box[0][1]], txt, fill=(0, 0, 0), font=font)
			
 
				+    img_left = Image.blend(image, img_left, 0.5)
			
 
				+    img_show = Image.new('RGB', (w * 2, h), (255, 255, 255))
			
 
				+    img_show.paste(img_left, (0, 0, w, h))
			
 
				+    img_show.paste(img_right, (w, 0, w * 2, h))
			
 
				+    return np.array(img_show)
			
 
				+
			
 
				+
			
 
				+def str_count(s):
			
 
				+    """
			
 
				+    Count the number of Chinese characters,
			
 
				+    a single English character and a single number
			
 
				+    equal to half the length of Chinese characters.
			
 
				+    args:
			
 
				+        s(string): the input of string
			
 
				+    return(int):
			
 
				+        the number of Chinese characters
			
 
				+    """
			
 
				+    import string
			
 
				+    count_zh = count_pu = 0
			
 
				+    s_len = len(s)
			
 
				+    en_dg_count = 0
			
 
				+    for c in s:
			
 
				+        if c in string.ascii_letters or c.isdigit() or c.isspace():
			
 
				+            en_dg_count += 1
			
 
				+        elif c.isalpha():
			
 
				+            count_zh += 1
			
 
				+        else:
			
 
				+            count_pu += 1
			
 
				+    return s_len - math.ceil(en_dg_count / 2)
			
 
				+
			
 
				+
			
 
				+def text_visual(texts,
			
 
				+                scores,
			
 
				+                img_h=400,
			
 
				+                img_w=600,
			
 
				+                threshold=0.,
			
 
				+                font_path="./doc/simfang.ttf"):
			
 
				+    """
			
 
				+    create new blank img and draw txt on it
			
 
				+    args:
			
 
				+        texts(list): the text will be draw
			
 
				+        scores(list|None): corresponding score of each txt
			
 
				+        img_h(int): the height of blank img
			
 
				+        img_w(int): the width of blank img
			
 
				+        font_path: the path of font which is used to draw text
			
 
				+    return(array):
			
 
				+    """
			
 
				+    if scores is not None:
			
 
				+        assert len(texts) == len(
			
 
				+            scores), "The number of txts and corresponding scores must match"
			
 
				+
			
 
				+    def create_blank_img():
			
 
				+        blank_img = np.ones(shape=[img_h, img_w], dtype=np.int8) * 255
			
 
				+        blank_img[:, img_w - 1:] = 0
			
 
				+        blank_img = Image.fromarray(blank_img).convert("RGB")
			
 
				+        draw_txt = ImageDraw.Draw(blank_img)
			
 
				+        return blank_img, draw_txt
			
 
				+
			
 
				+    blank_img, draw_txt = create_blank_img()
			
 
				+
			
 
				+    font_size = 20
			
 
				+    txt_color = (0, 0, 0)
			
 
				+    font = ImageFont.truetype(font_path, font_size, encoding="utf-8")
			
 
				+
			
 
				+    gap = font_size + 5
			
 
				+    txt_img_list = []
			
 
				+    count, index = 1, 0
			
 
				+    for idx, txt in enumerate(texts):
			
 
				+        index += 1
			
 
				+        if scores[idx] < threshold or math.isnan(scores[idx]):
			
 
				+            index -= 1
			
 
				+            continue
			
 
				+        first_line = True
			
 
				+        while str_count(txt) >= img_w // font_size - 4:
			
 
				+            tmp = txt
			
 
				+            txt = tmp[:img_w // font_size - 4]
			
 
				+            if first_line:
			
 
				+                new_txt = str(index) + ': ' + txt
			
 
				+                first_line = False
			
 
				+            else:
			
 
				+                new_txt = '    ' + txt
			
 
				+            draw_txt.text((0, gap * count), new_txt, txt_color, font=font)
			
 
				+            txt = tmp[img_w // font_size - 4:]
			
 
				+            if count >= img_h // gap - 1:
			
 
				+                txt_img_list.append(np.array(blank_img))
			
 
				+                blank_img, draw_txt = create_blank_img()
			
 
				+                count = 0
			
 
				+            count += 1
			
 
				+        if first_line:
			
 
				+            new_txt = str(index) + ': ' + txt + '   ' + '%.3f' % (scores[idx])
			
 
				+        else:
			
 
				+            new_txt = "  " + txt + "  " + '%.3f' % (scores[idx])
			
 
				+        draw_txt.text((0, gap * count), new_txt, txt_color, font=font)
			
 
				+        # whether add new blank img or not
			
 
				+        if count >= img_h // gap - 1 and idx + 1 < len(texts):
			
 
				+            txt_img_list.append(np.array(blank_img))
			
 
				+            blank_img, draw_txt = create_blank_img()
			
 
				+            count = 0
			
 
				+        count += 1
			
 
				+    txt_img_list.append(np.array(blank_img))
			
 
				+    if len(txt_img_list) == 1:
			
 
				+        blank_img = np.array(txt_img_list[0])
			
 
				+    else:
			
 
				+        blank_img = np.concatenate(txt_img_list, axis=1)
			
 
				+    return np.array(blank_img)
			
 
				+
			
 
				+
			
 
				+def base64_to_cv2(b64str):
			
 
				+    import base64
			
 
				+    data = base64.b64decode(b64str.encode('utf8'))
			
 
				+    data = np.fromstring(data, np.uint8)
			
 
				+    data = cv2.imdecode(data, cv2.IMREAD_COLOR)
			
 
				+    return data
			
 
				+
			
 
				+
			
 
				+def draw_boxes(image, boxes, scores=None, drop_score=0.5):
			
 
				+    if scores is None:
			
 
				+        scores = [1] * len(boxes)
			
 
				+    for (box, score) in zip(boxes, scores):
			
 
				+        if score < drop_score:
			
 
				+            continue
			
 
				+        box = np.reshape(np.array(box), [-1, 1, 2]).astype(np.int64)
			
 
				+        image = cv2.polylines(np.array(image), [box], True, (255, 0, 0), 2)
			
 
				+    return image
			
 
				+
			
 
				+
			
 
				+def get_rotate_crop_image(img, points):
			
 
				+    '''
			
 
				+    img_height, img_width = img.shape[0:2]
			
 
				+    left = int(np.min(points[:, 0]))
			
 
				+    right = int(np.max(points[:, 0]))
			
 
				+    top = int(np.min(points[:, 1]))
			
 
				+    bottom = int(np.max(points[:, 1]))
			
 
				+    img_crop = img[top:bottom, left:right, :].copy()
			
 
				+    points[:, 0] = points[:, 0] - left
			
 
				+    points[:, 1] = points[:, 1] - top
			
 
				+    '''
			
 
				+    assert len(points) == 4, "shape of points must be 4*2"
			
 
				+    img_crop_width = int(
			
 
				+        max(
			
 
				+            np.linalg.norm(points[0] - points[1]),
			
 
				+            np.linalg.norm(points[2] - points[3])))
			
 
				+    img_crop_height = int(
			
 
				+        max(
			
 
				+            np.linalg.norm(points[0] - points[3]),
			
 
				+            np.linalg.norm(points[1] - points[2])))
			
 
				+    pts_std = np.float32([[0, 0], [img_crop_width, 0],
			
 
				+                          [img_crop_width, img_crop_height],
			
 
				+                          [0, img_crop_height]])
			
 
				+    M = cv2.getPerspectiveTransform(points, pts_std)
			
 
				+    dst_img = cv2.warpPerspective(
			
 
				+        img,
			
 
				+        M, (img_crop_width, img_crop_height),
			
 
				+        borderMode=cv2.BORDER_REPLICATE,
			
 
				+        flags=cv2.INTER_CUBIC)
			
 
				+    dst_img_height, dst_img_width = dst_img.shape[0:2]
			
 
				+    if dst_img_height * 1.0 / dst_img_width >= 1.5:
			
 
				+        dst_img = np.rot90(dst_img)
			
 
				+    return dst_img
			
 
				+
			
 
				+
			
 
				+def check_gpu(use_gpu):
			
 
				+    if use_gpu and not paddle.is_compiled_with_cuda():
			
 
				+        use_gpu = False
			
 
				+    return use_gpu
			
 
				+
			
 
				+
			
 
# Script entry point: intentionally a no-op, running this file directly
# does nothing.
if __name__ == '__main__':
    pass