1
0
Fork 0
mirror of https://github.com/qurator-spk/page2tsv.git synced 2025-06-09 19:39:54 +02:00

Add directory parsing option to make-page2tsv-commands

This commit is contained in:
Kai 2021-03-10 12:03:45 +01:00
parent aa79678403
commit c554644838

View file

@@ -268,7 +268,7 @@ def make_page2tsv_commands(xls_file, directory, purpose):
elif directory is not None:
for file in glob.glob('{}/**/*.xml'.format(directory), recursive=True):
ma = re.match('(.*/(PPN[0-9]+)/([0-9]+)).xml', file)
ma = re.match('(.*/(PPN[0-9]+)/.*?([0-9]+).*?).xml', file)
if ma:
print('page2tsv {} {}.tsv '