# sxwl_DL / hr-ocr-idcard

							from dataclasses import dataclass
from typing import Any

from core.line_parser import LineParser
from core.parser import *
from core.direction import *
import numpy as np
from paddleocr import PaddleOCR

# ID-card OCR
@dataclass
class IdCardOcr:
    """Run OCR on an ID-card image and parse the result into a dict.

    The pipeline is: detect the image orientation, rotate the image
    accordingly, (re-)run OCR when needed, group the OCR output with
    ``LineParser`` and hand it to ``FrontParser`` (``image_type == 0``) or
    ``BackParser`` (``image_type == 1``).
    """

    # OCR engine; called as ``ocr.ocr(image, cls=True)``.
    ocr: PaddleOCR
    # Orientation detector; called as ``detect_angle(image, image_type)``.
    angle_detector: AngleDetector

    # Detection entry point
    def predict(self, image: np.ndarray, image_type) -> dict:
        """Recognise one ID-card image.

        Args:
            image: Image array passed to the angle detector and OCR engine.
            image_type: ``0`` selects ``FrontParser``, ``1`` selects
                ``BackParser``; anything accepted by ``int()`` is allowed.

        Returns:
            A dict with ``confidence``, ``card_type``, ``orientation`` and
            whatever keys the selected parser produces.

        Raises:
            Exception: If ``image_type`` is neither 0 nor 1, or if the OCR
                engine returns nothing during a re-run.
        """
        image_type = int(image_type)
        # Fail fast: an unsupported type would otherwise only be rejected in
        # _post_process, after angle detection and a full OCR pass.
        if image_type not in (0, 1):
            raise Exception('无法识别')

        image, angle, result = self._pre_process(image, image_type)
        print(f'---------- detect angle: {angle} 角度 --------')
        # The detector's own OCR result is reused only for type 0 with
        # angle 0; in every other case the (possibly rotated) image is
        # recognised again.
        if image_type != 0 or angle != 0:
            _, _, result = self._ocr(image)
        return self._post_process(result, angle, image_type)

    # Pre-processing (rotate the image)
    def _pre_process(self, image, image_type) -> tuple:
        """Detect the orientation and rotate the image accordingly.

        Returns:
            ``(image, angle, result)`` where ``image`` is the rotated image
            (unchanged for any angle other than 1, 2 or 3), ``angle`` is the
            detector's code and ``result`` is the OCR result the detector
            produced along the way.
        """
        # Image angle code and the OCR result generated during detection.
        angle, result = self.angle_detector.detect_angle(image, image_type)

        # NOTE(review): cv2 is not imported explicitly in this file;
        # presumably it is re-exported by one of the star imports - confirm.
        if angle == 1:
            image = cv2.rotate(image, cv2.ROTATE_90_COUNTERCLOCKWISE)
        elif angle == 2:
            image = cv2.rotate(image, cv2.ROTATE_180)
        elif angle == 3:
            image = cv2.rotate(image, cv2.ROTATE_90_CLOCKWISE)

        return image, angle, result

    # Fetch the model's recognition result
    def _ocr(self, image):
        """Run the OCR engine on ``image``.

        Returns:
            ``(txts, confs, result)``: the recognised strings, their
            confidences, and the raw engine output.

        Raises:
            Exception: If the engine returns an empty / falsy result.
        """
        result = self.ocr.ocr(image, cls=True)
        print("------------------")
        print(result)
        if not result:
            raise Exception('无法识别')
        # Assumes every entry looks like [box, (text, confidence)] - TODO
        # confirm against the installed PaddleOCR version, since some
        # releases nest the lines one level deeper (one list per image).
        confs = [line[1][1] for line in result]
        # Collect the recognised text into a list.
        txts = [line[1][0] for line in result]
        return txts, confs, result

    def _post_process(self, result, angle: int, image_type):
        """Parse a raw OCR result into the response dict.

        Args:
            result: Raw OCR output, passed to ``LineParser`` untouched.
            angle: Orientation code, reported as ``orientation``.
            image_type: ``0`` for ``FrontParser``, ``1`` for ``BackParser``.

        Raises:
            Exception: If ``image_type`` is neither 0 nor 1.
        """
        # Normalise once so the parser choice and the reported card_type
        # always agree.
        image_type = int(image_type)

        # Predicates handed to LineParser (presumably lines matching any of
        # them are discarded - confirm in LineParser):
        #   1. the line's ``is_slope`` attribute is truthy;
        #   2. the text, spaces removed, is non-empty and consists solely of
        #      ASCII letters (bytes.isalpha() is False for any non-ASCII
        #      byte of the UTF-8 encoding).
        filters = [lambda x: x.is_slope, lambda x: x.txt.replace(' ', '').encode('utf-8').isalpha()]
        line_parser = LineParser(result, filters)
        line_result = line_parser.parse()
        conf = line_parser.confidence

        if image_type == 0:
            parser = FrontParser(line_result)
        elif image_type == 1:
            parser = BackParser(line_result)
        else:
            raise Exception('无法识别')
        ocr_res = parser.parse()
        res = {
            "confidence": conf,
            "card_type": str(image_type),
            # NOTE(review): the previous comment said the counter-clockwise
            # angle is converted to clockwise here, but the value is passed
            # through unchanged - confirm which convention callers expect.
            "orientation": angle,
            **ocr_res
        }
        print(res)
        return res