From 8e86337ff164addc0bcc0fd95e42b207680a909a Mon Sep 17 00:00:00 2001 From: liuyebo <1515783401@qq.com> Date: Wed, 14 Aug 2024 11:25:04 +0800 Subject: [PATCH] =?UTF-8?q?=E4=BC=98=E5=8C=96=E5=8C=BB=E9=99=A2=E5=90=8D?= =?UTF-8?q?=E7=B9=81=E7=AE=80=E8=BD=AC=E6=8D=A2?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- docker-compose.yml | 2 +- photo_review/__init__.py | 1 + requirements.txt | 1 + util/data_util.py | 4 ++-- util/util.py | 8 ++++++++ 5 files changed, 13 insertions(+), 3 deletions(-) diff --git a/docker-compose.yml b/docker-compose.yml index 110255e..b70d4b3 100644 --- a/docker-compose.yml +++ b/docker-compose.yml @@ -1,6 +1,6 @@ x-env: &template - image: fcb_photo_review:1.12.2 + image: fcb_photo_review:1.12.3 restart: always services: diff --git a/photo_review/__init__.py b/photo_review/__init__.py index 8051056..f5aaa0b 100644 --- a/photo_review/__init__.py +++ b/photo_review/__init__.py @@ -69,6 +69,7 @@ HOSPITAL_ALIAS = { "江阴徐霞客医院": ["江阴市徐霞客医院"], "江阴北国医院": ["江阴市北国医院"], "溧阳茶亭医院": ["溧阳市茶亭医院"], + "南京市六合中医院": ["南京市六合区中医院"] } """ diff --git a/requirements.txt b/requirements.txt index f408f85..f4e4cf2 100644 --- a/requirements.txt +++ b/requirements.txt @@ -1,5 +1,6 @@ numpy==1.26.4 onnxconverter-common==1.14.0 +OpenCC==1.1.9 opencv-python==4.6.0.66 paddle2onnx==1.2.3 paddleclas==2.5.2 diff --git a/util/data_util.py b/util/data_util.py index bb9ad6c..aa97138 100644 --- a/util/data_util.py +++ b/util/data_util.py @@ -181,8 +181,8 @@ def parse_hospital(string): if not string: return result + string = util.traditional_to_simple_chinese(string) string_without_brackets = string.replace(")", "").replace(")", "").replace("(", " ").replace("(", " ") string_without_company = string_without_brackets.replace("有限公司", "") - simple_chinese_string = string_without_company.replace("醫", "医") - result += simple_chinese_string.split(" ") + result += string_without_company.split(" ") return result diff --git a/util/util.py b/util/util.py index 41d7b60..29b9737 100644 --- a/util/util.py +++ b/util/util.py @@ -2,6 +2,8 @@ import logging import os from datetime import datetime +from opencc import OpenCC + from util import string_util @@ -209,3 +211,9 @@ def chinese_money_to_number(chinese_money_amount): amount += j / 10 amount += f / 100 return round(amount, 2) + + +# 将繁体字转换为简体字 +def traditional_to_simple_chinese(traditional_chinese): + converter = OpenCC('t2s') + return converter.convert(traditional_chinese)