1
0
Fork 0
mirror of https://github.com/qurator-spk/dinglehopper.git synced 2025-06-07 19:05:13 +02:00

🐛 Fix word segmentation with uniseg 0.8.0

This commit is contained in:
Mike Gerber 2024-03-26 19:34:22 +01:00
parent 4b64398cec
commit 4d4ead4cc8
2 changed files with 2 additions and 2 deletions

View file

@@ -1,7 +1,7 @@
click
jinja2
lxml
-uniseg >= 0.7.2
+uniseg >= 0.8.0
numpy
colorama
MarkupSafe

View file

@@ -24,7 +24,7 @@ def patch_word_break():
def new_word_break(c, index=0):
if 0xE000 <= ord(c) <= 0xF8FF: # Private Use Area
-return "ALetter"
+return uniseg.wordbreak.WordBreak.ALETTER
else:
return old_word_break(c, index)