mirror of
https://github.com/qurator-spk/sbb_ner.git
synced 2025-10-24 15:14:13 +02:00
Merge branch 'master' of code.dev.sbb.berlin:qurator/mono-repo
This commit is contained in:
commit
19c4eaa15f
2 changed files with 7 additions and 2 deletions
4
Makefile
4
Makefile
|
@ -199,8 +199,10 @@ $(BUILD_PATH)/bert-all-german-de-finetuned/$(EPOCH_FILE):
|
||||||
bert-ner --train_sets='GERM-EVAL-TRAIN|DE-CONLL-TRAIN' --dev_sets='GERM-EVAL-DEV|DE-CONLL-TESTA' --bert_model=$(BERT_FINETUNED_PATH) --output_dir=$(@D) $(BERT_NER_OPTIONS) >> $(@D).log 2<&1
|
bert-ner --train_sets='GERM-EVAL-TRAIN|DE-CONLL-TRAIN' --dev_sets='GERM-EVAL-DEV|DE-CONLL-TESTA' --bert_model=$(BERT_FINETUNED_PATH) --output_dir=$(@D) $(BERT_NER_OPTIONS) >> $(@D).log 2<&1
|
||||||
|
|
||||||
$(BUILD_PATH)/bert-complete-de-finetuned/$(EPOCH_FILE):
|
$(BUILD_PATH)/bert-complete-de-finetuned/$(EPOCH_FILE):
|
||||||
bert-ner --train_sets='GERM-EVAL-TRAIN|DE-CONLL-TRAIN|SBB|ONB|LFT|DE-CONLL-TESTA|DE-CONLL-TESTB|GERM-EVAL-TEST' --bert_model=$(BERT_FINETUNED_PATH) --output_dir=$(@D) $(BERT_NER_OPTIONS) >> $(@D).log 2<&1
|
bert-ner --train_sets='GERM-EVAL-TRAIN|GERM-EVAL-DEV|DE-CONLL-TRAIN|DE-CONLL-DEV|SBB|ONB|LFT|DE-CONLL-TESTA|DE-CONLL-TESTB|GERM-EVAL-TEST' --bert_model=$(BERT_FINETUNED_PATH) --output_dir=$(@D) $(BERT_NER_OPTIONS) >> $(@D).log 2<&1
|
||||||
|
|
||||||
|
$(BUILD_PATH)/bert-multilang-de-finetuned/$(EPOCH_FILE):
|
||||||
|
bert-ner --train_sets='GERM-EVAL-DEV|GERM-EVAL-TEST|GERM-EVAL-TRAIN|SBB|ONB|LFT|BNF|KB|DE-CONLL-DEV|DE-CONLL-TESTA|DE-CONLL-TESTB|DE-CONLL-TRAIN|EN-CONLL-TESTA|EN-CONLL-TESTB|EN-CONLL-TRAIN' --bert_model=$(BERT_FINETUNED_PATH) --output_dir=$(@D) $(BERT_NER_OPTIONS) >> $(@D).log 2<&1
|
||||||
|
|
||||||
|
|
||||||
$(BUILD_PATH)/bert-wikiner-de-finetuned/$(EPOCH_FILE):
|
$(BUILD_PATH)/bert-wikiner-de-finetuned/$(EPOCH_FILE):
|
||||||
|
|
|
@ -61,7 +61,10 @@ def main(path_to_ner_corpora, ner_ground_truth_file):
|
||||||
|
|
||||||
gt_all = read_gt(['{}/enp_DE.sbb.bio/enp_DE.sbb.bio'.format(path_to_ner_corpora),
|
gt_all = read_gt(['{}/enp_DE.sbb.bio/enp_DE.sbb.bio'.format(path_to_ner_corpora),
|
||||||
'{}/enp_DE.onb.bio/enp_DE.onb.bio'.format(path_to_ner_corpora),
|
'{}/enp_DE.onb.bio/enp_DE.onb.bio'.format(path_to_ner_corpora),
|
||||||
'{}/enp_DE.lft.bio/enp_DE.lft.bio'.format(path_to_ner_corpora)], ['SBB', 'ONB', 'LFT'])
|
'{}/enp_DE.lft.bio/enp_DE.lft.bio'.format(path_to_ner_corpora),
|
||||||
|
'{}/enp_FR.bnf.bio/enp_FR.bnf.bio'.format(path_to_ner_corpora),
|
||||||
|
'{}/enp_NL.kb.bio/enp_NL.kb.bio'.format(path_to_ner_corpora)],
|
||||||
|
['SBB', 'ONB', 'LFT', 'BNF', 'KB'])
|
||||||
|
|
||||||
gt_all.to_pickle(ner_ground_truth_file)
|
gt_all.to_pickle(ner_ground_truth_file)
|
||||||
|
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue