chenguilong
/
test_script


			
							123456789101112131415161718192021222324252627282930313233343536373839404142
							import numpy as np
from itertools import chain
from mdutils.mdutils import MdUtils
from YQ_OCR.utils.datasets import Dataset
from YQ_OCR.utils.text2md import TableMD
from YQ_OCR.utils.utils import *

# 1. xlsx -> 正确json文件(写入厂家信息)
# 2. 发送图片(带正确json文件)
# 3. 把返回的json 和正确的json 进行对比(有key--用返回结果与正确结果比对,无key--用正确结果与返回结果比对)


if __name__ == '__main__':
    img_paths = chain(*[Path(imgs_path).rglob(f'*.{ext}') for ext in ['jpg', 'png', 'jpeg']])
    all_rate = []
    table_mean_acc = []
    for img_path in img_paths:
        print(img_path)
        true_d, true_json = open_true_json(img_path.with_suffix('.json'))
        result = send_request(img_path, true_json)
        res_d = parse_result(result)

        markdown = TableMD(img_path.name)
        markdown.write_header(title='推理结果', level=2)
        # json result
        rate, statistics = markdown.evaluate_one(true_d, res_d)
        all_rate.append(rate)
        print(f'文字识别正确率：{rate:.2f}%')

        # table gt result
        dataset = Dataset(gt_file=img_path.with_suffix('.txt'), img_name=img_path.name, results=res_d)
        markdown.write_table_accuracy(ds=dataset, key='new')
        table_acc = markdown.get_table_accuracy()
        table_mean_acc.append(table_acc)
        print(f'表格识别正确率：{table_acc:.2f}%')
        markdown.f.create_md_file()

    print('----------------------------------------')
    all_rate = "{:.2f}%".format(np.mean(all_rate))
    all_table_rate = "{:.2f}%".format(np.mean(table_mean_acc))
    print(f'文字识别总体正确率：{all_rate}')
    print(f'表格识别总体正确率：{all_table_rate}')