diff --git a/qurator/mods4pandas/mods4pandas.py b/qurator/mods4pandas/mods4pandas.py index 7229d37..ffc3697 100755 --- a/qurator/mods4pandas/mods4pandas.py +++ b/qurator/mods4pandas/mods4pandas.py @@ -323,8 +323,10 @@ def pages_to_dict(mets, raise_errors=True) -> List[Dict]: while (cursor := cursor.getparent()).tag == f"{{{ns['mets']}}}div": yield cursor + struct_divs_to_add = set() for struct_div in struct_divs: - struct_divs.update(get_struct_log_parents(struct_div)) + struct_divs_to_add.update(get_struct_log_parents(struct_div)) + struct_divs.update(struct_divs_to_add) for struct_div in struct_divs: type_ = struct_div.attrib.get("TYPE")