Merge pull request #253 from harry0703/dev

optimize segmentation
This commit is contained in:
Harry 2024-04-13 21:04:22 +08:00 committed by GitHub
commit b1506b9161
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194
2 changed files with 17 additions and 2 deletions

View File

@@ -53,7 +53,7 @@ listen_port = _cfg.get("listen_port", 8080)
# Display name of the project; falls back to "MoneyPrinterTurbo" when the key
# is absent from _cfg.
project_name = _cfg.get("project_name", "MoneyPrinterTurbo")
# Project description; the fallback is an HTML link to the GitHub repository.
project_description = _cfg.get(
    "project_description",
    "<a href='https://github.com/harry0703/MoneyPrinterTurbo'>https://github.com/harry0703/MoneyPrinterTurbo</a>",
)
# Version string reported when _cfg does not override it. The earlier "1.1.0"
# assignment was overwritten immediately by this one, so only the effective
# value is kept.
project_version = _cfg.get("project_version", "1.1.1")
reload_debug = False
# NOTE(review): read from `app` rather than `_cfg` -- presumably a separate
# config section; confirm against the loader. Defaults to an empty string.
imagemagick_path = app.get("imagemagick_path", "")

View File

@@ -163,12 +163,27 @@ def str_contains_punctuation(word):
def split_string_by_punctuations(s):
    """Split ``s`` into whitespace-trimmed segments at punctuation characters.

    Every character contained in ``const.PUNCTUATIONS`` ends the current
    segment. The one exception is a "." that sits directly between two
    digits (the decimal point in "2.5%"), which stays inside the segment.

    Args:
        s: The text to split.

    Returns:
        A list of segments with surrounding whitespace stripped. One segment
        is emitted per separator hit, so consecutive separators produce empty
        strings. Non-blank text following the last separator is returned as
        the final segment instead of being discarded.
    """
    result = []
    current = []
    last_index = len(s) - 1

    for i, char in enumerate(s):
        # Look the neighbours up per position so that no value is carried
        # over from an earlier iteration.
        previous_char = s[i - 1] if i > 0 else ""
        next_char = s[i + 1] if i < last_index else ""

        if char == "." and previous_char.isdigit() and next_char.isdigit():
            # e.g. "a 2.5% fee is charged on a withdrawal of 10,000":
            # the "." inside 2.5 must not be treated as a break marker.
            current.append(char)
            continue

        if char not in const.PUNCTUATIONS:
            current.append(char)
        else:
            result.append("".join(current).strip())
            current = []

    # Flush whatever follows the final separator; without this the last
    # segment of text that does not end in punctuation would be lost.
    tail = "".join(current).strip()
    if tail:
        result.append(tail)

    return result