From 493541fddf86f8d57688c82f25a7b35e472c0581 Mon Sep 17 00:00:00 2001 From: "Gerber, Mike" Date: Tue, 1 Oct 2019 12:35:44 +0200 Subject: [PATCH] =?UTF-8?q?=F0=9F=90=9B=20dinglehopper:=20Always=20work=20?= =?UTF-8?q?with=20NFC=20text?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- qurator/dinglehopper/substitute_equivalences.py | 3 +++ 1 file changed, 3 insertions(+) diff --git a/qurator/dinglehopper/substitute_equivalences.py b/qurator/dinglehopper/substitute_equivalences.py index faa873e..3556a52 100644 --- a/qurator/dinglehopper/substitute_equivalences.py +++ b/qurator/dinglehopper/substitute_equivalences.py @@ -1,3 +1,6 @@ +import unicodedata + + def substitute_equivalences(s): # These are for OCR-D GT vs Tesseract frk vs Calamari GT4HistOCR