diff --git a/src/python/run_train_ner.py b/src/python/run_train_ner.py
index 0f61d7534731c7ced0bd8bea6fab4adf77a4bca3..158787244b9fc5f96ab038db13014cc92462047d 100644
--- a/src/python/run_train_ner.py
+++ b/src/python/run_train_ner.py
@@ -115,7 +115,7 @@ def main(model=None, output_dir=None, n_iter=100, training_data=None, trained_da
     if output_dir is not None:
         output_dir = Path(output_dir)
         if not output_dir.exists():
-            output_dir.mkdir()
+            output_dir.mkdir(parents=True)
         nlp.to_disk(output_dir)
         print("Saved model to", output_dir)
 
diff --git a/src/sh/train_ner.sh b/src/sh/train_ner.sh
new file mode 100755
--- /dev/null
+++ b/src/sh/train_ner.sh
@@ -0,0 +1,19 @@
+#!/bin/bash
+#
+# Run src/python/run_train_ner.py on the corrected 1891_20026449 German sample.
+# All paths below are relative, so invoke this script from the repository root.
+
+# Abort on the first failing command, unset variable, or failed pipeline stage.
+set -euo pipefail
+
+path_data=data/train_NER/
+model=de_core_news_sm
+n_iter=2
+training_data=${path_data}1891_20026449_corrected_german.txt
+trained_data=${path_data}1891_20026449_corrected_german_trained.txt
+new_model=${path_data}models/de_1891_20026449
+
+# Disabled renku wrapper, presumably a prefix for the command below; kept for reference.
+#renku run --isolation --output $trained_data --output $new_model
+# Expansions are quoted so the paths survive word splitting and globbing.
+python src/python/run_train_ner.py -m "$model" -n "$n_iter" -t "$training_data" -o "$new_model" -u "$trained_data"