Remove ExtractedText support from the bag metrics.

2025-10-29 08:24:16 +01:00 · 2021-06-11 10:23:26 +02:00 · 2021-06-11 10:23:26 +02:00 · 9f5112f8f6
commit 9f5112f8f6
parent 381fe7cb6b
2 changed files with 1 addition and 10 deletions
--- a/qurator/dinglehopper/metrics/bag_of_words_accuracy.py
+++ b/qurator/dinglehopper/metrics/bag_of_words_accuracy.py
@@ -1,20 +1,12 @@
 from collections import Counter
-from typing import Union

 from .utils import bag_accuracy, MetricResult, Weights
-from .. import ExtractedText
 from ..normalize import words_normalized


 def bag_of_words_accuracy(
-    reference: Union[str, ExtractedText],
-    compared: Union[str, ExtractedText],
-    weights: Weights,
+    reference: str, compared: str, weights: Weights
 ) -> MetricResult:
-    if isinstance(reference, ExtractedText):
-        reference = reference.text
-    if isinstance(compared, ExtractedText):
-        compared = compared.text
    reference_words = Counter(words_normalized(reference))
    compared_words = Counter(words_normalized(compared))
    result = bag_accuracy(reference_words, compared_words, weights)
--- a/qurator/dinglehopper/tests/metrics/test_bag_accuracy.py
+++ b/qurator/dinglehopper/tests/metrics/test_bag_accuracy.py
@@ -1,4 +1,3 @@
-import math
 import unicodedata
 from collections import Counter