remove spam

master
Kai Labusch 1 month ago
parent ef8244a466
commit 8d8bf517b9

@@ -346,13 +346,6 @@ def tsv2tsv(tsv_in_file, tsv_out_file, ner_rest_endpoint, noproxy,
prev_pos = 0
for idx, _ in tsv_out.iterrows():
# if idx < len(tsv_out) and len(tsv_out.loc[idx, 'TOKEN']) == 0 and tsv_out.loc[idx+1, 'No.'] == 0:
# print("word_pos=0!!!!")
# word_pos = 0
#
# if 0 < tsv_out.loc[idx, 'No.'] < word_pos:
# word_pos = 0
if prev_pos != 0 and not tsv_out.loc[idx, 'NE-TAG'].startswith('I-') and \
tsv_out.loc[idx, 'No.'] == 0 or len(tsv_out.loc[idx, 'TOKEN']) == 0:
word_pos = 0

Loading…
Cancel
Save