1
0
Fork 0
mirror of https://github.com/qurator-spk/page2tsv.git synced 2025-06-09 19:39:54 +02:00

make code more robust

This commit is contained in:
Kai 2021-05-06 15:13:26 +02:00
parent 49861b1652
commit d4eb95b64b

View file

@@ -29,7 +29,7 @@ def write_tsv(tsv, urls, tsv_out_file):
for url_id, part in tsv.groupby('url_id'):
with open(tsv_out_file, 'a') as f:
-f.write('# ' + urls[url_id] + '\n')
+f.write('# ' + urls[int(url_id)] + '\n')
part.to_csv(tsv_out_file, sep="\t", quoting=3, index=False, mode='a', header=False)