From b92d166be60054799256295cb99669929ae864b7 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Rafa=C5=82=20Jaworski?=
Date: Thu, 30 May 2019 11:32:51 +0200
Subject: [PATCH] script added

---
 tools/addSample.sh | 24 ++++++++++++++++++++++++
 1 file changed, 24 insertions(+)
 create mode 100755 tools/addSample.sh

diff --git a/tools/addSample.sh b/tools/addSample.sh
new file mode 100755
index 0000000..a62051e
--- /dev/null
+++ b/tools/addSample.sh
@@ -0,0 +1,24 @@
+#!/bin/sh
+#
+# Runs addFastAlignedTM.py and then addSources.py on the files of the
+# opensubtitles_sample corpus directory.
+#
+# Both helper scripts and the corpus directory are referenced relative to
+# the current working directory, so run this from the directory that
+# contains them.
+
+# Abort on the first failing command or unset variable, so addSources.py
+# is never run after addFastAlignedTM.py has failed.
+set -eu
+
+CORPUS_NAME=opensubtitles_sample
+CORPUS_PATH="./$CORPUS_NAME"
+SRC_LANG_ID=1
+TRG_LANG_ID=2
+
+# Arguments are positional; keep their order.
+./addFastAlignedTM.py "$CORPUS_NAME" \
+    "$CORPUS_PATH/src_clean.txt" "$CORPUS_PATH/src_clean.lem" "$SRC_LANG_ID" \
+    "$CORPUS_PATH/trg_clean.txt" "$TRG_LANG_ID" \
+    "$CORPUS_PATH/alignments.txt" "$CORPUS_PATH/ids_clean.txt"
+./addSources.py "$CORPUS_PATH/ids_sources_censored.txt"