1
0
Fork 0
mirror of https://github.com/qurator-spk/modstool.git synced 2025-06-08 11:20:07 +02:00

🧹 Do not duplicate ALTO metadata

This commit is contained in:
Gerber, Mike 2022-05-06 19:36:50 +02:00
parent 6e2e0bd67a
commit 102b15ffa9

View file

@ -116,12 +116,8 @@ def process(alto_files: List[str], output_file: str, output_csv: str, output_xls
with warnings.catch_warnings(record=True) as caught_warnings: with warnings.catch_warnings(record=True) as caught_warnings:
warnings.simplefilter('always') # do NOT filter double occurrences warnings.simplefilter('always') # do NOT filter double occurrences
# MODS # ALTO
d = flatten(alto_to_dict(alto, raise_errors=True)) d = flatten(alto_to_dict(alto, raise_errors=True))
# METS
d_alto = flatten(alto_to_dict(alto, raise_errors=True))
for k, v in d_alto.items():
d[f"alto_{k}"] = v
# "meta" # "meta"
d['alto_file'] = alto_file d['alto_file'] = alto_file