调整涂抹的ocr模型参数;优化关键词

This commit is contained in:
2024-07-19 12:15:02 +08:00
parent 69f4fecd4f
commit 5193839c9e
2 changed files with 13 additions and 10 deletions

View File

@@ -1,4 +1,4 @@
from paddlenlp.utils.doc_parser import DocParser
from paddleocr import PaddleOCR
"""
项目配置
@@ -19,11 +19,11 @@ UPLOAD_TRY_TIMES = 3
"""
# Keyword table whose entries use name-like labels ("姓名" = name,
# "交款人" = payer, "购买方名称" = buyer name). Each entry pairs a "key"
# string with an integer "length".
# NOTE(review): presumably "key" is the label searched for in OCR output and
# "length" bounds the value read after it - confirm against the code that
# consumes this list.
# NOTE(review): "款人" is listed twice below. This text looks like a rendered
# diff whose +/- markers were stripped, so one copy may be a removed line -
# confirm against the real file before deduplicating.
NAME_KEYS = [
{"key": "姓名", "length": 4},
{"key": "交款人", "length": 4},
{"key": "款人", "length": 4},
# NOTE(review): "娃名" looks like a deliberate entry for an OCR misreading of
# "姓名" - confirm.
{"key": "娃名", "length": 4},
{"key": "款人", "length": 4},
{"key": "购买方名称", "length": 4},
]
# Keyword table for the ID-card-number label ("身份证号"); same entry layout
# as NAME_KEYS, with "length" set to 19.
ID_CARD_NUM_KEYS = [{"key": "身份证号", "length": 19}, ]
# Earlier PaddleOCR configuration, left commented out:
# OCR = PaddleOCR(use_angle_cls=False, show_log=False, gpu_id=1)
# NOTE(review): OCR is bound here and rebound two lines below. If both
# assignments are live, the DocParser is still constructed but only the
# PaddleOCR instance stays bound to OCR - confirm which line belongs in the
# real file.
OCR = DocParser(use_gpu=True, layout_analysis=False)
# If spaces should not be recognized, set use_space_char=False. Always test
# after changing that option: in version 2.7.3 it has a bug that causes
# recognition to fail.
OCR = PaddleOCR(use_angle_cls=False, show_log=False, det_db_box_thresh=0.3)