concordia-docker/tools/addSample.sh

10 lines
354 B
Bash
Raw Normal View History

2019-05-30 11:32:51 +02:00
#!/bin/sh
# Loads the "opensubtitles_sample" corpus by invoking two helper scripts in
# sequence: ./addFastAlignedTM.py with the corpus files, then ./addSources.py
# with the corpus' source-id file.
#
# All paths are relative to the current working directory, so run this from
# the directory that holds both helper scripts and the corpus directory.
#
# NOTE(review): the meaning of each positional argument is inferred from the
# file names only; confirm against addFastAlignedTM.py / addSources.py.

# Stop at the first failing command (so addSources.py never runs after a
# failed import) and treat unset variables as errors.
set -eu

readonly CORPUS_NAME=opensubtitles_sample
readonly CORPUS_PATH="./${CORPUS_NAME}"
readonly SRC_LANG_ID=1
readonly TRG_LANG_ID=2

# Argument order is preserved exactly from the original single-line call.
./addFastAlignedTM.py \
  "$CORPUS_NAME" \
  "$CORPUS_PATH/src_clean.txt" \
  "$CORPUS_PATH/src_clean.lem" \
  "$SRC_LANG_ID" \
  "$CORPUS_PATH/trg_clean.txt" \
  "$TRG_LANG_ID" \
  "$CORPUS_PATH/alignments.txt" \
  "$CORPUS_PATH/ids_clean.txt"

./addSources.py "$CORPUS_PATH/ids_sources_censored.txt"