From b72e02acb799979f259dd51c20dccb755f138702 Mon Sep 17 00:00:00 2001
From: Jakub Maruniak
Date: Sun, 21 Mar 2021 20:11:39 +0000
Subject: [PATCH] =?UTF-8?q?Smazat=20=E2=80=9Epages/students/2016/jakub=5Fm?=
 =?UTF-8?q?aruniak/dp2021/annotation/train/prepare.sh=E2=80=9C?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 .../dp2021/annotation/train/prepare.sh | 19 -------------------
 1 file changed, 19 deletions(-)
 delete mode 100644 pages/students/2016/jakub_maruniak/dp2021/annotation/train/prepare.sh

diff --git a/pages/students/2016/jakub_maruniak/dp2021/annotation/train/prepare.sh b/pages/students/2016/jakub_maruniak/dp2021/annotation/train/prepare.sh
deleted file mode 100644
index ade40371f4..0000000000
--- a/pages/students/2016/jakub_maruniak/dp2021/annotation/train/prepare.sh
+++ /dev/null
@@ -1,19 +0,0 @@
-mkdir -p build
-mkdir -p build/input
-# Prepare Treebank
-mkdir -p build/input/slovak-treebank
-spacy convert ./sources/slovak-treebank/stb.conll ./build/input/slovak-treebank
-# UDAG used as evaluation
-mkdir -p build/input/ud-artificial-gapping
-spacy convert ./sources/ud-artificial-gapping/sk-ud-crawled-orphan.conllu ./build/input/ud-artificial-gapping
-# Prepare skner
-mkdir -p build/input/skner
-# Convert to IOB
-cat ./sources/skner/wikiann-sk.bio | python ./sources/bio-to-iob.py > build/input/skner/wikiann-sk.iob
-# Split to train test
-cat ./build/input/skner/wikiann-sk.iob | python ./sources/iob-to-traintest.py ./build/input/skner/wikiann-sk
-# Convert train and test
-mkdir -p build/input/skner-train
-spacy convert -n 15 --converter ner ./build/input/skner/wikiann-sk.train ./build/input/skner-train
-mkdir -p build/input/skner-test
-spacy convert -n 15 --converter ner ./build/input/skner/wikiann-sk.test ./build/input/skner-test