Merge branch 'master' of code.dev.sbb.berlin:qurator/mono-repo

pull/2/head
Kai Labusch 5 years ago
commit 19c4eaa15f

@ -199,8 +199,10 @@ $(BUILD_PATH)/bert-all-german-de-finetuned/$(EPOCH_FILE):
bert-ner --train_sets='GERM-EVAL-TRAIN|DE-CONLL-TRAIN' --dev_sets='GERM-EVAL-DEV|DE-CONLL-TESTA' --bert_model=$(BERT_FINETUNED_PATH) --output_dir=$(@D) $(BERT_NER_OPTIONS) >> $(@D).log 2<&1 bert-ner --train_sets='GERM-EVAL-TRAIN|DE-CONLL-TRAIN' --dev_sets='GERM-EVAL-DEV|DE-CONLL-TESTA' --bert_model=$(BERT_FINETUNED_PATH) --output_dir=$(@D) $(BERT_NER_OPTIONS) >> $(@D).log 2<&1
$(BUILD_PATH)/bert-complete-de-finetuned/$(EPOCH_FILE): $(BUILD_PATH)/bert-complete-de-finetuned/$(EPOCH_FILE):
bert-ner --train_sets='GERM-EVAL-TRAIN|DE-CONLL-TRAIN|SBB|ONB|LFT|DE-CONLL-TESTA|DE-CONLL-TESTB|GERM-EVAL-TEST' --bert_model=$(BERT_FINETUNED_PATH) --output_dir=$(@D) $(BERT_NER_OPTIONS) >> $(@D).log 2<&1 bert-ner --train_sets='GERM-EVAL-TRAIN|GERM-EVAL-DEV|DE-CONLL-TRAIN|DE-CONLL-DEV|SBB|ONB|LFT|DE-CONLL-TESTA|DE-CONLL-TESTB|GERM-EVAL-TEST' --bert_model=$(BERT_FINETUNED_PATH) --output_dir=$(@D) $(BERT_NER_OPTIONS) >> $(@D).log 2<&1
$(BUILD_PATH)/bert-multilang-de-finetuned/$(EPOCH_FILE):
bert-ner --train_sets='GERM-EVAL-DEV|GERM-EVAL-TEST|GERM-EVAL-TRAIN|SBB|ONB|LFT|BNF|KB|DE-CONLL-DEV|DE-CONLL-TESTA|DE-CONLL-TESTB|DE-CONLL-TRAIN|EN-CONLL-TESTA|EN-CONLL-TESTB|EN-CONLL-TRAIN' --bert_model=$(BERT_FINETUNED_PATH) --output_dir=$(@D) $(BERT_NER_OPTIONS) >> $(@D).log 2<&1
$(BUILD_PATH)/bert-wikiner-de-finetuned/$(EPOCH_FILE): $(BUILD_PATH)/bert-wikiner-de-finetuned/$(EPOCH_FILE):

@ -61,7 +61,10 @@ def main(path_to_ner_corpora, ner_ground_truth_file):
gt_all = read_gt(['{}/enp_DE.sbb.bio/enp_DE.sbb.bio'.format(path_to_ner_corpora), gt_all = read_gt(['{}/enp_DE.sbb.bio/enp_DE.sbb.bio'.format(path_to_ner_corpora),
'{}/enp_DE.onb.bio/enp_DE.onb.bio'.format(path_to_ner_corpora), '{}/enp_DE.onb.bio/enp_DE.onb.bio'.format(path_to_ner_corpora),
'{}/enp_DE.lft.bio/enp_DE.lft.bio'.format(path_to_ner_corpora)], ['SBB', 'ONB', 'LFT']) '{}/enp_DE.lft.bio/enp_DE.lft.bio'.format(path_to_ner_corpora),
'{}/enp_FR.bnf.bio/enp_FR.bnf.bio'.format(path_to_ner_corpora),
'{}/enp_NL.kb.bio/enp_NL.kb.bio'.format(path_to_ner_corpora)],
['SBB', 'ONB', 'LFT', 'BNF', 'KB'])
gt_all.to_pickle(ner_ground_truth_file) gt_all.to_pickle(ner_ground_truth_file)

Loading…
Cancel
Save