2 years ago · a0b1c05114
--- a/.gitignore
+++ b/.gitignore
@@ -2,5 +2,5 @@
 
				 .idea
			
 
				 .vscode
			
 
				 __pycache__/
			
 
				-*.json
			
 
				-*.md
			
 
				+#*.json
			
 
				+#*.md
			
--- a/HR_OCR/test_script/to_md/README.md
+++ b/HR_OCR/test_script/to_md/README.md
@@ -0,0 +1,46 @@
 
				+# 人力OCR
			
 
				+
			
 
				+## 生成markdown测试报告脚本
			
 
				+
			
 
				+1. 生成**目的文件夹**下图片的**json文件**
			
 
				+
			
 
				+- **目的文件夹**: 
			
 
				+  - 存放所需测试**图片文件夹**
			
 
				+  - 对**文件夹**内图片进行标准化
			
 
				+    - 运行`suffix.py`脚本
			
 
				+    - 产生*.jpg
			
 
				+  - 生成<u>算法推理json文件</u>
			
 
				+    - 运行`convert_json.py`脚本
			
 
				+    - 产生对应jpg 文件的json文件
			
 
				+  - 修改<u>算法推理json文件</u>成**正确的json文件**
			
 
				+
			
 
				+2. 运行生成md报告的脚本
			
 
				+
			
 
				+- 修改use.py 并运行
			
 
				+
			
 
				+  ```python
			
 
				+  # config
			
 
				+  
			
 
				+  # 目的文件夹
			
 
				+  image_path = Path('/Users/zeke/work/sx/OCR/image_data/户口本9.30/0/img/')
			
 
				+  # 图片type(如果接口不存在传0不影响结果)
			
 
				+  image_type = 0
			
 
				+  # 是否旋转
			
 
				+  image_rotate = False
			
 
				+  
			
 
				+  # ocr地址选择
			
 
				+  # 本地环境、腾讯云测试环境、腾讯云生产环境、电信云测试环境、电信云生产环境
			
 
				+  ocr_address = 'local'  # 'local' 'TXtest' 'TXsb' 'DXtest' 'DXsb'
			
 
				+  # ocr能力选择
			
 
				+  ocr_name = 'regbook'  # 'cet' 'idcard' 'bankcard' 'regbook' 'schoolcert' 'business_license'
			
 
				+  # 生成MD文件名
			
 
				+  md_name = 'RegBook'
			
 
				+  # ocr能力对应字段（）
			
 
				+  filed = 'regbook'
			
 
				+  
			
 
				+  # 若md_path为None 则默认使用图片父路径为markdown保存路径
			
 
				+  # md_path = '/Users/zeke/work/sx/OCR/HROCR/to_md/example' or image_path.parent
			
 
				+  md_path = None or image_path.parent
			
 
				+  ```
			
 
				+
			
 
				+  
			
--- a/HR_OCR/test_script/to_md/example/img/1_img.json
+++ b/HR_OCR/test_script/to_md/example/img/1_img.json
@@ -0,0 +1,9 @@
 
				+{
			
 
				+    "orientation": 0,
			
 
				+    "name": "鉴康",
			
 
				+    "id": "152801200003178527",
			
 
				+    "language": "英语",
			
 
				+    "level": "CET4",
			
 
				+    "exam_time": "2021年6月",
			
 
				+    "score": "451"
			
 
				+}
			
--- a/HR_OCR/test_script/to_md/example/img/2_img.json
+++ b/HR_OCR/test_script/to_md/example/img/2_img.json
@@ -0,0 +1,9 @@
 
				+{
			
 
				+    "orientation": 0,
			
 
				+    "name": "张鑫",
			
 
				+    "id": "140227199809282317",
			
 
				+    "language": "英语",
			
 
				+    "level": "CET4",
			
 
				+    "exam_time": "2021年6月",
			
 
				+    "score": "445"
			
 
				+}
			
--- a/HR_OCR/test_script/tools/README.md
+++ b/HR_OCR/test_script/tools/README.md
@@ -0,0 +1,34 @@
 
				+# 人力OCR
			
 
				+
			
 
				+## convert_json.py
			
 
				+
			
 
				+```python
			
 
				+# 项目url
			
 
				+url = 'http://192.168.199.27:18040'
			
 
				+# 目标文件夹
			
 
				+imgs_path = './HR_OCR/to_md/example/img'
			
 
				+
			
 
				+def send_request(img_path, image_type = 0):
			
 
				+    with open(img_path, 'rb') as f:
			
 
				+        img_str: str = base64.encodebytes(f.read()).decode('utf-8')
			
 
				+        data = {
			
 
				+            'image': img_str,
			
 
				+            'image_type': image_type
			
 
				+        }
			
 
				+        idc_header = {
			
 
				+            'Content-Type': 'application/json',
			
 
				+            'Authorization': 'Bearer 4e00c444-620b-4d3c-85f4-777e64276f0e'
			
 
				+        }
			
 
				+        r = requests.post(f'{url}/cettest/cet', json=data, headers=idc_header)
			
 
				+        # r = requests.post(f'{url}/hkbsbtest/regbook', json=data)
			
 
				+        print(r.json())
			
 
				+        return r.json()
			
 
				+```
			
 
				+
			
 
				+## suffix.py
			
 
				+
			
 
				+```python
			
 
				+# 需要格式化的目的文件夹路径
			
 
				+target_path = './HR_OCR/to_md/example/img'
			
 
				+```
			
 
				+
			
--- a/HR_OCR/to_md/README.md
+++ b/HR_OCR/to_md/README.md
@@ -0,0 +1,46 @@
 
				+# 人力OCR
			
 
				+
			
 
				+## 生成markdown测试报告脚本
			
 
				+
			
 
				+1. 生成**目的文件夹**下图片的**json文件**
			
 
				+
			
 
				+- **目的文件夹**: 
			
 
				+  - 存放所需测试**图片文件夹**
			
 
				+  - 对**文件夹**内图片进行标准化
			
 
				+    - 运行`suffix.py`脚本
			
 
				+    - 产生*.jpg
			
 
				+  - 生成<u>算法推理json文件</u>
			
 
				+    - 运行`convert_json.py`脚本
			
 
				+    - 产生对应jpg 文件的json文件
			
 
				+  - 修改<u>算法推理json文件</u>成**正确的json文件**
			
 
				+
			
 
				+2. 运行生成md报告的脚本
			
 
				+
			
 
				+- 修改use.py 并运行
			
 
				+
			
 
				+  ```python
			
 
				+  # config
			
 
				+  
			
 
				+  # 目的文件夹
			
 
				+  image_path = Path('/Users/zeke/work/sx/OCR/image_data/户口本9.30/0/img/')
			
 
				+  # 图片type(如果接口不存在传0不影响结果)
			
 
				+  image_type = 0
			
 
				+  # 是否旋转
			
 
				+  image_rotate = False
			
 
				+  
			
 
				+  # ocr地址选择
			
 
				+  # 本地环境、腾讯云测试环境、腾讯云生产环境、电信云测试环境、电信云生产环境
			
 
				+  ocr_address = 'local'  # 'local' 'TXtest' 'TXsb' 'DXtest' 'DXsb'
			
 
				+  # ocr能力选择
			
 
				+  ocr_name = 'regbook'  # 'cet' 'idcard' 'bankcard' 'regbook' 'schoolcert' 'business_license'
			
 
				+  # 生成MD文件名
			
 
				+  md_name = 'RegBook'
			
 
				+  # ocr能力对应字段（）
			
 
				+  filed = 'regbook'
			
 
				+  
			
 
				+  # 若md_path为None 则默认使用图片父路径为markdown保存路径
			
 
				+  # md_path = '/Users/zeke/work/sx/OCR/HROCR/to_md/example' or image_path.parent
			
 
				+  md_path = None or image_path.parent
			
 
				+  ```
			
 
				+
			
 
				+  
			
--- a/HR_OCR/to_md/example/img/1_img.json
+++ b/HR_OCR/to_md/example/img/1_img.json
@@ -0,0 +1,9 @@
 
				+{
			
 
				+    "orientation": 0,
			
 
				+    "name": "鉴康",
			
 
				+    "id": "152801200003178527",
			
 
				+    "language": "英语",
			
 
				+    "level": "CET4",
			
 
				+    "exam_time": "2021年6月",
			
 
				+    "score": "451"
			
 
				+}
			
--- a/HR_OCR/to_md/example/img/2_img.json
+++ b/HR_OCR/to_md/example/img/2_img.json
@@ -0,0 +1,9 @@
 
				+{
			
 
				+    "orientation": 0,
			
 
				+    "name": "张鑫",
			
 
				+    "id": "140227199809282317",
			
 
				+    "language": "英语",
			
 
				+    "level": "CET4",
			
 
				+    "exam_time": "2021年6月",
			
 
				+    "score": "445"
			
 
				+}
			
--- a/HR_OCR/tools/README.md
+++ b/HR_OCR/tools/README.md
@@ -0,0 +1,34 @@
 
				+# 人力OCR
			
 
				+
			
 
				+## convert_json.py
			
 
				+
			
 
				+```python
			
 
				+# 项目url
			
 
				+url = 'http://192.168.199.27:18040'
			
 
				+# 目标文件夹
			
 
				+imgs_path = './HR_OCR/to_md/example/img'
			
 
				+
			
 
				+def send_request(img_path, image_type = 0):
			
 
				+    with open(img_path, 'rb') as f:
			
 
				+        img_str: str = base64.encodebytes(f.read()).decode('utf-8')
			
 
				+        data = {
			
 
				+            'image': img_str,
			
 
				+            'image_type': image_type
			
 
				+        }
			
 
				+        idc_header = {
			
 
				+            'Content-Type': 'application/json',
			
 
				+            'Authorization': 'Bearer 4e00c444-620b-4d3c-85f4-777e64276f0e'
			
 
				+        }
			
 
				+        r = requests.post(f'{url}/cettest/cet', json=data, headers=idc_header)
			
 
				+        # r = requests.post(f'{url}/hkbsbtest/regbook', json=data)
			
 
				+        print(r.json())
			
 
				+        return r.json()
			
 
				+```
			
 
				+
			
 
				+## suffix.py
			
 
				+
			
 
				+```python
			
 
				+# 需要格式化的目的文件夹路径
			
 
				+target_path = './HR_OCR/to_md/example/img'
			
 
				+```
			
 
				+