forked from ishwnews/MASS
-
Notifications
You must be signed in to change notification settings - Fork 0
/
nmt_pretrained_with_mass.sh
executable file
·33 lines (32 loc) · 1.51 KB
/
nmt_pretrained_with_mass.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
#DATA_PATH=YOUR_DATA_PATH
DATA_PATH=./pretrained-data/processed/
CUDA_VISIBLE_DEVICES=1 python train.py \
--exp_name unsupMT_enfr \
--dump_path ./models/en-fr/ \
--exp_id enfr_mass_single_gpu \
--data_path $DATA_PATH \
--lgs 'en-fr' \
--ae_steps 'en,fr' \
--bt_steps 'en-fr-en,fr-en-fr' \
--ms_steps 'en,fr' \
--word_shuffle 3 \
--word_dropout 0.1 \
--word_blank 0.1 \
--word_mass 0.25 \
--lambda_bt '0:0,100000:0' \
--lambda_ae '0:0,100000:0,300000:0' \
--encoder_only false \
--emb_dim 1024 \
--n_layers 6 \
--n_heads 8 \
--dropout 0.1 \
--attention_dropout 0.1 \
--gelu_activation true \
--tokens_per_batch 2000 \
--batch_size 32 \
--bptt 256 \
--optimizer adam_inverse_sqrt,beta1=0.9,beta2=0.98,lr=0.0001 \
--epoch_size 200000 \
--eval_bleu true \
--min_len 10 \
--max_epoch 20