提高涂抹的准确性

2024-07-11 17:25:36 +08:00
parent e3198ccdf6
commit fee59b3133
1 changed files with 55 additions and 6 deletions
--- a/photo_mask.py
+++ b/photo_mask.py
@@ -76,6 +76,11 @@ def split_image(img, max_ratio=1.41, best_ration=1.41, overlap=0.05):
    return split_result


+def capture_image(img, layout):  # Crop img to the rectangle described by layout and return the sliced region.
+    x1, y1, x2, y2 = layout  # layout must unpack to exactly four values: left, top, right, bottom
+    return img[int(y1):int(y2), int(x1):int(x2)]  # first axis is sliced by y, second by x; bounds are truncated with int() (presumably img is an OpenCV/NumPy image array - confirm)
+
+
 # 获取图片旋转角度
 def get_image_rotation_angles(img):
    angles = ['0', '90']
@@ -182,7 +187,16 @@ def get_ocr_layout(ocr, img_path):
    return layout


-def find_box_of_content(content, layout):
+def zoom_box(box, ratio):  # Return a new [x1, y1, x2, y2] list with each coordinate scaled by ratio and passed through round().
+    x1, y1, x2, y2 = box  # box must unpack to exactly four values
+    x1 = round(x1 - x1 * ratio)  # NOTE(review): each edge moves by ratio * its own coordinate, so the margin depends on distance from the origin, not on the box size - confirm this is intended
+    y1 = round(y1 - y1 * ratio)  # top edge is pulled toward the origin (for non-negative y1 and ratio > 0)
+    x2 = round(x2 + x2 * ratio)  # right edge is pushed away from the origin; nothing here clamps it to the image width
+    y2 = round(y2 + y2 * ratio)  # bottom edge is pushed away from the origin; nothing here clamps it to the image height
+    return [x1, y1, x2, y2]  # a fresh list; the input box is not modified
+
+
+def find_box_of_content(content, layout, img_path):
    full_box = layout[0]
    x_len = full_box[2] - full_box[0]
    y_len = full_box[3] - full_box[1]
@@ -201,20 +215,55 @@ def find_box_of_content(content, layout):

    if direction == "x":
        # 横向排布
-        return (
+        box = [
            full_box[0] + index * char_len,
            full_box[1],
            full_box[0] + (index + len(content) + 1) * char_len,
            full_box[3],
-        )
+        ]
+        is_abnormal = box[2] - box[0] < (box[3] - box[1]) * len(content) / 2
    else:
        # 纵向排布
-        return (
+        box = [
            full_box[0],
            full_box[1] + index * char_len,
            full_box[2],
            full_box[1] + (index + len(content) + 1) * char_len,
-        )
+        ]
+        is_abnormal = box[3] - box[1] < (box[2] - box[0]) * len(content) / 2
+
+    if is_abnormal:
+        # 比例异常，再次识别
+        image = cv2.imread(img_path)
+        # 截图时偏大一点
+        capture_box = zoom_box(box, 0.2)
+        captured_image = capture_image(image, capture_box)
+        with tempfile.NamedTemporaryFile(suffix=".jpg", delete=False) as temp_file:
+            cv2.imwrite(temp_file.name, captured_image)
+        try:
+            layouts = DOC_PARSER.parse({"doc": temp_file.name})["layout"]
+        except TypeError:
+            # 如果是类型错误，大概率是没识别到文字
+            layouts = []
+        except Exception as e:
+            # 如果出现其他错误，抛出
+            raise e
+        for layout in layouts:
+            if content in layout[1]:
+                temp_box = find_box_of_content(content, layout, temp_file.name)
+                if temp_box:
+                    box = [
+                        temp_box[0] + capture_box[0],
+                        temp_box[1] + capture_box[1],
+                        temp_box[2] + capture_box[0],
+                        temp_box[3] + capture_box[1],
+                    ]
+                    break
+        try:
+            os.remove(temp_file.name)
+        except Exception as e:
+            logging.info(f"删除临时文件 {temp_file.name} 时出错", exc_info=e)
+    return box


 def find_box_of_value(key, layout, length):
@@ -275,7 +324,7 @@ def get_mask_layout(image, contents):
            for layout in layouts:
                for content in contents:
                    if content in layout[1]:
-                        result.append(find_box_of_content(content, layout))
+                        result.append(find_box_of_content(content, layout, temp_file.name))
                if "姓名" in layout[1]:
                    result.append(find_box_of_value("姓名", layout, 4))
                if "交款人" in layout[1]: