#!/bin/sh
#
# Runs ./addFastAlignedTM.py for a single corpus, passing it the corpus name,
# the corpus files located under CORPUS_PATH, and the two language ids.
#
# All paths are relative, so the script must be started from the directory
# that contains addFastAlignedTM.py and from which ../fast-aligner resolves.
#
# NOTE(review): the language ids are presumably identifiers known to the
# system the helper writes to -- confirm against addFastAlignedTM.py.

# Abort on a failing command or on use of an unset variable.
set -eu

# Name of the corpus; also the name of its directory under corpora/.
CORPUS_NAME=opensubtitles

# Directory holding the corpus files consumed below.
CORPUS_PATH=../fast-aligner/corpora/$CORPUS_NAME

# Language ids handed to the helper for the source and target side.
SRC_LANG_ID=1
TRG_LANG_ID=2

# Every expansion is quoted so that a corpus name or path containing
# whitespace or glob characters still reaches the helper as one argument.
# Argument order is unchanged: name, source text, source .lem file, source
# language id, target text, target language id, alignments, ids.
./addFastAlignedTM.py \
  "$CORPUS_NAME" \
  "$CORPUS_PATH/src_clean.txt" \
  "$CORPUS_PATH/src_clean.lem" \
  "$SRC_LANG_ID" \
  "$CORPUS_PATH/trg_clean.txt" \
  "$TRG_LANG_ID" \
  "$CORPUS_PATH/alignments.txt" \
  "$CORPUS_PATH/ids_clean.txt"