Merge pull request #132 from qurator-spk/fix/uniseg-removed-index-parameter

🐛 Fix for changed API of uniseg's word_break
pull/134/head
Mike Gerber 5 days ago committed by GitHub
commit a09a624bde
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

@@ -25,7 +25,7 @@ jobs:
     strategy:
       fail-fast: false
       matrix:
-        python-version: [ "3.8", "3.9", "3.10", "3.11", "3.12", "3.13" ]
+        python-version: [ "3.9", "3.10", "3.11", "3.12", "3.13" ]
     runs-on: "ubuntu-latest"

@@ -1,7 +1,7 @@
 click
 jinja2
 lxml
-uniseg >= 0.8.0
+uniseg >= 0.9.1
 numpy
 colorama
 MarkupSafe

@@ -22,11 +22,11 @@ def patch_word_break():
     """
     old_word_break = uniseg.wordbreak.word_break
-    def new_word_break(c, index=0):
+    def new_word_break(c):
         if 0xE000 <= ord(c) <= 0xF8FF: # Private Use Area
-            return uniseg.wordbreak.WordBreak.ALETTER
+            return uniseg.wordbreak.Word_Break.ALetter
         else:
-            return old_word_break(c, index)
+            return old_word_break(c)
     uniseg.wordbreak.word_break = new_word_break
     global word_break_patched

Loading…
Cancel
Save