10 lines
354 B
Bash
Executable File
10 lines
354 B
Bash
Executable File
#!/bin/sh
#
# Runs ./addFastAlignedTM.py on the files of the opensubtitles_sample corpus
# directory, then runs ./addSources.py on that directory's
# ids_sources_censored.txt.
#
# Both helper scripts and the corpus directory are referenced relative to the
# current working directory, so invoke this script from the directory that
# contains them.

# Stop at the first failing command (and on any unset variable) so that
# addSources.py is never run after a failed addFastAlignedTM.py.
set -eu

CORPUS_NAME=opensubtitles_sample
CORPUS_PATH=./$CORPUS_NAME

# NOTE(review): presumably language identifiers understood by
# addFastAlignedTM.py -- confirm what 1 and 2 refer to.
SRC_LANG_ID=1
TRG_LANG_ID=2

# The arguments are positional; the order below is the order the script
# receives them in, so do not reorder. Expansions are quoted so that a corpus
# name or path containing whitespace or glob characters is passed intact.
./addFastAlignedTM.py \
  "$CORPUS_NAME" \
  "$CORPUS_PATH/src_clean.txt" \
  "$CORPUS_PATH/src_clean.lem" \
  "$SRC_LANG_ID" \
  "$CORPUS_PATH/trg_clean.txt" \
  "$TRG_LANG_ID" \
  "$CORPUS_PATH/alignments.txt" \
  "$CORPUS_PATH/ids_clean.txt"

./addSources.py "$CORPUS_PATH/ids_sources_censored.txt"