transfix-train/scripts/marian-train.sh

51 lines
1.4 KiB
Bash
Raw Normal View History

2022-01-14 18:45:36 +01:00
#!/bin/bash
#
# Launch Marian training of a transformer model on BPE-segmented data.
#
# Usage: marian-train.sh CORPUS_ROOT BPE_MERGES EPOCHS
#
# Arguments:
#   1. root of a gonito.net challenge-like file structure
#   2. number of BPE merge operations, e.g. 32000 (used as a file-name suffix)
#   3. expected number of training epochs (passed to --after-epochs)
#
# Inputs (must already exist):
#   CORPUS_ROOT/train/in.tsv.BPE_MERGES        source side
#   CORPUS_ROOT/train/expected.tsv.BPE_MERGES  target side
#
# The marian binary is taken from ~/marian/build/marian and the training log
# is written to ~/train.log.
#
# Exit status: 2 on a usage error, 1 when an input file is missing, otherwise
# whatever marian returns.

set -euo pipefail

if (( $# < 3 )); then
  printf 'Usage: %s CORPUS_ROOT BPE_MERGES EPOCHS\n' "${0##*/}" >&2
  exit 2
fi

# path to corpus
corpus_path="$1"
bpe_merges="$2"
epochs="$3"

# Reject anything that is not a plain non-negative integer before it reaches
# marian's option parser.
if [[ ! "$epochs" =~ ^[0-9]+$ ]]; then
  printf 'error: EPOCHS must be a non-negative integer, got "%s"\n' \
    "$epochs" >&2
  exit 2
fi

source_file="$corpus_path"/train/in.tsv."$bpe_merges"
target_file="$corpus_path"/train/expected.tsv."$bpe_merges"

# Only referenced by the disabled --vocabs option listed after the command;
# kept so that option can be re-enabled without re-deriving the paths.
# shellcheck disable=SC2034
source_vocab="$source_file".vocab."$bpe_merges".yml
# shellcheck disable=SC2034
target_vocab="$target_file".vocab."$bpe_merges".yml

# Fail early with a clear message instead of letting the trainer start on
# paths that do not exist.
for train_file in "$source_file" "$target_file"; do
  if [[ ! -r "$train_file" ]]; then
    printf 'error: cannot read training file: %s\n' "$train_file" >&2
    exit 1
  fi
done

# The command below must stay one uninterrupted run of backslash-continued
# lines: a comment or blank line in the middle would end the command early.
~/marian/build/marian \
  --type transformer \
  --overwrite \
  --train-sets "$source_file" "$target_file" \
  --max-length 100 \
  --mini-batch-fit -w 10000 --maxi-batch 1000 \
  --valid-freq 5000 \
  --save-freq 5000 \
  --disp-freq 500 \
  --beam-size 6 --normalize 0.6 \
  --enc-depth 6 --dec-depth 6 \
  --transformer-heads 8 \
  --transformer-postprocess-emb d \
  --transformer-postprocess dan \
  --transformer-dropout 0.1 --label-smoothing 0.1 \
  --learn-rate 0.0003 --lr-warmup 16000 --lr-decay-inv-sqrt 16000 --lr-report \
  --optimizer-params 0.9 0.98 1e-09 --clip-norm 5 \
  --tied-embeddings \
  --exponential-smoothing \
  --log ~/train.log \
  --after-epochs="$epochs"

# Options that are currently disabled. To re-enable one, move it into the
# command above (before the final line) and keep the trailing backslash.
#--vocabs "$source_vocab" "$target_vocab"
#--early-stopping 10 \
#--model model/model.npz
#--valid-log model/valid.log \
#--valid-metrics cross-entropy perplexity translation \
#--valid-sets data/valid.bpe.en data/valid.bpe.de \
#--valid-script-path ./scripts/validate.sh \
#--valid-translation-output data/valid.bpe.en.output --quiet-translation \
#--valid-mini-batch 64 \