sxwl_DL
/
hr-ocr-idcard


			
							123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172
							from dataclasses import dataclass
from core.idcrad import *
from core.direction import *
import numpy as np
from paddleocr import PaddleOCR


@dataclass
class IdCardOcr:
    ocr: PaddleOCR
    image: np.ndarray
    image_type: str = '0'

    def predict(self):
        txts, confs, angle = self._ocr()
        if int(self.image_type) == 0:
            parser = FrontParser(txts, confs)
        elif int(self.image_type) == 1:
            parser = BackParser(txts, confs)

        return self._post_process(angle, parser, self.image_type)

    def _align_image(self, image):
        angle = detect_angle(image)
        print(angle)  # 逆时针
        if angle == 180:
            image = cv2.rotate(image, cv2.ROTATE_180)
        if angle == 90:
            image = cv2.rotate(image, cv2.ROTATE_90_CLOCKWISE)
        if angle == 270:
            image = cv2.rotate(image, cv2.ROTATE_90_COUNTERCLOCKWISE)
        return image, angle

    def _ocr(self):
        image = self.image
        image, angle = self._align_image(image)
        # 获取模型检测结果
        result = self.ocr.ocr(image, cls=True)
        print("------------------")
        print(result)
        if not result:
            return None
        confs = [line[1][1] for line in result]

        # 将检测到的文字放到一个列表中
        txts = [line[1][0] for line in result]
        print("......................................")
        print(txts)
        print("......................................")
        return txts, confs, angle


    def _post_process(self, angle: int, parser: Parser, image_type: str):
        content = parser.parse()
        conf = parser.confidence

        return {
            "confidence": conf,
            "card_type": image_type,
            "orientation": angle // 90,
            "name": content["Name"].to_dict(),
            "id": content["IDNumber"].to_dict(),
            "ethnicity": content["Nationality"].to_dict(),
            "gender": content["Gender"].to_dict(),
            "birthday": content["Birth"].to_dict(),
            "address_province": content["address_province"].to_dict(),
            "address_city": content["address_city"].to_dict(),
            "address_region": content["address_region"].to_dict(),
            "address_detail": content["address_detail"].to_dict(),
            "expire_date": content["expire_date"].to_dict()
        }