# scripts-transfomer-iwslt-envi.sh
# Commands for preparing data, training, decoding and BLEU-scoring
# Transformer models on the IWSLT English-Vietnamese (en-vi) data.
# make data
# Runs wrap-data.py for the en/vi pair; the four path arguments are passed
# in the same order as before (train, tst2012, tst2013, vocab).
python2.7 scripts/wrap-data.py en vi \
  /nfs/project/nmt/space_vh/tmp/envi/train \
  sample-data/tst2012 \
  sample-data/tst2013 \
  sample-data/vocab
# full data
# use all available vocabularies in vocab.en and vocab.vi
# small model (--nlayers 2, --num-units 128, --num-heads 2)
small_dir=experiments/models/envi/small
# Suffix shared by the training log and the translation file of this setup.
small_tag=transformer.base_h2_l2_u128_do010101010101_att1_ls01_pe2_ml150_ffrelu
# -p: create missing parent directories and do not fail if the directory
# already exists from an earlier run.
mkdir -p "${small_dir}"
# Training is started as a background job; stdout and stderr go to the log.
./build_gpu/transformer-train --dynet-devices GPU:1 \
  --max-seq-len 150 --minibatch-size 1024 --treport 1000 --dreport 50000 \
  --src-vocab sample-data/vocab.en --tgt-vocab sample-data/vocab.vi \
  -t /nfs/project/nmt/space_vh/tmp/envi/train.en-vi.capped \
  -d sample-data/tst2012.en-vi.capped \
  -p "${small_dir}" \
  -e 100 --lr-eta 0.1 --lr-patience 8 --patience 15 --lr-eta-decay 1.5 \
  --encoder-emb-dropout-p 0.1 --encoder-sublayer-dropout-p 0.1 \
  --decoder-emb-dropout-p 0.1 --decoder-sublayer-dropout-p 0.1 \
  --attention-dropout-p 0.1 --ff-dropout-p 0.1 --ff-activation-type 1 \
  --nlayers 2 --num-units 128 --num-heads 2 \
  --use-label-smoothing --label-smoothing-weight 0.1 \
  --position-encoding 2 --reset-if-stuck \
  &> "${small_dir}/train.en-vi.${small_tag}.log" &
# Block until the training job has exited. Without this, running the file as
# a script would start decoding while the model is still being trained.
wait "$!"
# decode
# Both substitutions run in one sed process, in the same order as before:
# strip "<s> " first, then " </s>".
./build_gpu/transformer-decode --dynet-devices GPU:1 \
  --model-path "${small_dir}" --beam 5 -T sample-data/tst2013.en.capped \
  | sed -e 's/<s> //g' -e 's/ <\/s>//g' \
  > "${small_dir}/translation-beam5.en-vi.${small_tag}"
# Score the translation against the tst2013 reference; the result is printed
# to stdout.
/nfs/team/nlp/users/vhoang/tools/mosesdecoder/scripts/generic/multi-bleu.perl \
  sample-data/tst2013.vi \
  < "${small_dir}/translation-beam5.en-vi.${small_tag}"
# medium models
# run1 (--nlayers 4, --num-units 512, --num-heads 4)
run1_dir=experiments/models/envi/run1
# Suffix shared by the training log and the translation file of this setup.
run1_tag=transformer.base_h4_l4_u512_do010101010101_att1_ls01_pe2_ml150_ffrelu
# -p: create missing parent directories and do not fail if the directory
# already exists from an earlier run.
mkdir -p "${run1_dir}"
# Training is started as a background job; stdout and stderr go to the log.
./build_gpu/transformer-train --dynet-devices GPU:1 \
  --max-seq-len 150 --minibatch-size 1024 --treport 1000 --dreport 50000 \
  --src-vocab sample-data/vocab.en --tgt-vocab sample-data/vocab.vi \
  -t /nfs/project/nmt/space_vh/tmp/envi/train.en-vi.capped \
  -d sample-data/tst2012.en-vi.capped \
  -p "${run1_dir}" \
  -e 100 --lr-eta 0.1 --lr-patience 8 --patience 15 --lr-eta-decay 1.5 \
  --encoder-emb-dropout-p 0.1 --encoder-sublayer-dropout-p 0.1 \
  --decoder-emb-dropout-p 0.1 --decoder-sublayer-dropout-p 0.1 \
  --attention-dropout-p 0.1 --ff-dropout-p 0.1 --ff-activation-type 1 \
  --nlayers 4 --num-units 512 --num-heads 4 \
  --use-label-smoothing --label-smoothing-weight 0.1 \
  --position-encoding 2 --reset-if-stuck \
  &> "${run1_dir}/train.en-vi.${run1_tag}.log" &
# Block until the training job has exited. Without this, running the file as
# a script would start decoding while the model is still being trained.
wait "$!"
# decode
# Both substitutions run in one sed process, in the same order as before:
# strip "<s> " first, then " </s>".
./build_gpu/transformer-decode --dynet-devices GPU:1 \
  --model-path "${run1_dir}" --beam 5 -T sample-data/tst2013.en.capped \
  | sed -e 's/<s> //g' -e 's/ <\/s>//g' \
  > "${run1_dir}/translation-beam5.en-vi.${run1_tag}"
# Score the translation against the tst2013 reference; the result is printed
# to stdout.
/nfs/team/nlp/users/vhoang/tools/mosesdecoder/scripts/generic/multi-bleu.perl \
  sample-data/tst2013.vi \
  < "${run1_dir}/translation-beam5.en-vi.${run1_tag}"
# run 2 (same hyper-parameter flags as run1, separate model directory)
run2_dir=experiments/models/envi/run2
# Suffix shared by the training log and the translation file of this setup.
run2_tag=transformer.base_h4_l4_u512_do010101010101_att1_ls01_pe2_ml150_ffrelu
# -p: create missing parent directories and do not fail if the directory
# already exists from an earlier run.
mkdir -p "${run2_dir}"
# Training is started as a background job; stdout and stderr go to the log.
./build_gpu/transformer-train --dynet-devices GPU:1 \
  --max-seq-len 150 --minibatch-size 1024 --treport 1000 --dreport 50000 \
  --src-vocab sample-data/vocab.en --tgt-vocab sample-data/vocab.vi \
  -t /nfs/project/nmt/space_vh/tmp/envi/train.en-vi.capped \
  -d sample-data/tst2012.en-vi.capped \
  -p "${run2_dir}" \
  -e 100 --lr-eta 0.1 --lr-patience 8 --patience 15 --lr-eta-decay 1.5 \
  --encoder-emb-dropout-p 0.1 --encoder-sublayer-dropout-p 0.1 \
  --decoder-emb-dropout-p 0.1 --decoder-sublayer-dropout-p 0.1 \
  --attention-dropout-p 0.1 --ff-dropout-p 0.1 --ff-activation-type 1 \
  --nlayers 4 --num-units 512 --num-heads 4 \
  --use-label-smoothing --label-smoothing-weight 0.1 \
  --position-encoding 2 --reset-if-stuck \
  &> "${run2_dir}/train.en-vi.${run2_tag}.log" &
# Block until the training job has exited. Without this, running the file as
# a script would start decoding while the model is still being trained.
wait "$!"
# decode
# Both substitutions run in one sed process, in the same order as before:
# strip "<s> " first, then " </s>".
./build_gpu/transformer-decode --dynet-devices GPU:1 \
  --model-path "${run2_dir}" --beam 5 -T sample-data/tst2013.en.capped \
  | sed -e 's/<s> //g' -e 's/ <\/s>//g' \
  > "${run2_dir}/translation-beam5.en-vi.${run2_tag}"
# Score the translation against the tst2013 reference; the result is printed
# to stdout.
/nfs/team/nlp/users/vhoang/tools/mosesdecoder/scripts/generic/multi-bleu.perl \
  sample-data/tst2013.vi \
  < "${run2_dir}/translation-beam5.en-vi.${run2_tag}"
# ensemble 2 runs
ens_dir=experiments/models/envi/ensemble_2runs
# Suffix shared by every translation / score file written below.
ens_tag=transformer.base_h4_l4_u512_do010101010101_att1_ls01_pe2_ml150_ffrelu
ens_bleu=/nfs/team/nlp/users/vhoang/tools/mosesdecoder/scripts/generic/multi-bleu.perl
# -p: create missing parent directories and do not fail if the directory
# already exists from an earlier run.
mkdir -p "${ens_dir}"
cp experiments/models/envi/run1/*.vocab "${ens_dir}"
# Build the ensemble model.config by concatenating the run1 and run2 configs,
# each followed by one empty line. The file is rewritten from scratch (">"
# on the whole loop) so that re-running this section does not append the
# same entries a second time.
for f in experiments/models/envi/run1/model.config experiments/models/envi/run2/model.config; do
  cat "${f}"
  echo
done > "${ens_dir}/model.config"
# tst2012, then tst2013: decode with beam 5, strip "<s> " and " </s>" from the
# output, and store the multi-bleu.perl result next to the translation in
# <translation>.scoreBLEU.
for ens_testset in tst2012 tst2013; do
  ens_hyp="${ens_dir}/translation-beam5.${ens_testset}.en-vi.${ens_tag}"
  ./build_gpu/transformer-decode --dynet-devices GPU:1 \
    --model-path "${ens_dir}" --beam 5 \
    -T "sample-data/${ens_testset}.en.capped" \
    | sed -e 's/<s> //g' -e 's/ <\/s>//g' \
    > "${ens_hyp}"
  "${ens_bleu}" "sample-data/${ens_testset}.vi" \
    < "${ens_hyp}" \
    > "${ens_hyp}.scoreBLEU"
done