forked from KEMT/zpwiki
		
	
		
			
				
	
	
		
			25 lines
		
	
	
		
			919 B
		
	
	
	
		
			Bash
		
	
	
	
	
	
			
		
		
	
	
			25 lines
		
	
	
		
			919 B
		
	
	
	
		
			Bash
		
	
	
	
	
	
# Train and package the Slovak spaCy model.
#
# Stages:
#   1. wipe and recreate the working directories,
#   2. train the tagger + dependency parser and keep the best model,
#   3. train the NER component,
#   4. package the result and build a source distribution into dist/.
#
# Paths are relative, so the script must be run from the repository root.

# Abort on the first failing command.
set -e

OUTDIR=build/train/output
TRAINDIR=build/train

# Delete old training results.
# -f is required: with `set -e`, a plain `rm -r` aborts the whole script on a
# fresh checkout where the directory does not exist yet.
rm -rf "$TRAINDIR"

mkdir -p "$TRAINDIR"
mkdir -p "$OUTDIR"
mkdir -p dist

# Make sure the output directory is empty. With the default layout OUTDIR lives
# inside TRAINDIR and has just been recreated, so this only matters if OUTDIR
# is pointed somewhere else. `${OUTDIR:?}` refuses to expand to `/*` if the
# variable is ever empty.
rm -rf "${OUTDIR:?}"/*

# Train dependency parser and POS tagger.
# The two positional paths are the training and development data passed to
# `spacy train`; 15 iterations, pipeline restricted to tagger and parser.
spacy train sk "$OUTDIR" ./build/input/slovak-treebank ./build/input/ud-artificial-gapping --n-iter 15 -p tagger,parser

# Keep only the best tagger/parser model under a stable name.
rm -rf "$TRAINDIR/posparser"
mv "$OUTDIR/model-best" "$TRAINDIR/posparser"

# Train NER.
# A custom training script exists, but it takes too long. Its input is a JSONL
# file (database exported from Prodigy):
# python custom_train.py train ./build/train/posparser ./train.jsonl ./eval.jsonl -o ./build/train/nerposparser -n 15
spacy train sk "$TRAINDIR/nerposparser" ./ner/experiments/34sknerfull.json ./ner/experiments/34wikiartfull.json --n-iter 15 -p ner

# Package model.
# NOTE(review): the tagger/parser stage above takes `model-best` from the train
# output directory, but here the top-level NER output directory is packaged
# directly, and the NER run is not given the posparser model as a base --
# confirm this is intended.
spacy package "$TRAINDIR/nerposparser" dist --meta-path ./meta.json --force

# Build the source distribution next to the package directory (i.e. in dist/).
# NOTE(review): the directory name is hard-coded; presumably it has to match
# the name and version in meta.json -- verify when bumping the version.
cd dist/sk_sk1-0.2.0
python ./setup.py sdist --dist-dir ../