forked from lovecambi/qebrain
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathexp_train.sh
executable file
·40 lines (36 loc) · 1.01 KB
/
exp_train.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
# Launch training of expert_model.py with --src=lower.de and --tgt=lower.en.
#
# Run from the directory that contains expert_model.py, ./data/para and
# ./data/vocab: every path below is relative to the current directory.
#
# WARNING: the previous contents of ./saved_exp_model are deleted before
# training starts.

# Stop at the first failing command or unset variable so that training never
# starts against a missing or only partially cleaned output directory.
set -eu

# Eight devices are exposed here; --num_gpus at the end of the command is set
# to the same count, so change both together.
export CUDA_VISIBLE_DEVICES=0,1,2,3,4,5,6,7

datadir=./data/para
vocabdir=./data/vocab
modeldir=./saved_exp_model

mkdir -p -- "$modeldir"
# ${modeldir:?} aborts instead of expanding to "/*" should the variable ever
# be empty; the glob stays outside the quotes so it still expands. As before,
# dotfiles in the directory are not matched by "*" and are left in place.
rm -rf -- "${modeldir:?}"/*

# batch_size is token level.
# infer_batch_size is example level.
python expert_model.py \
  --src=lower.de \
  --tgt=lower.en \
  --train_prefix="${datadir}/train" \
  --dev_prefix="${datadir}/dev" \
  --test_prefix="${datadir}/dev" \
  --vocab_prefix="${vocabdir}/vocab120k" \
  --max_vocab_size=120000 \
  --out_dir="${modeldir}" \
  --optimizer=lazyadam \
  --warmup_steps=8000 \
  --learning_rate=2.1 \
  --num_train_steps=500000 \
  --steps_per_stats=100 \
  --steps_per_external_eval=1000 \
  --embedding_size=512 \
  --num_units=512 \
  --num_layers=2 \
  --ffn_inner_dim=512 \
  --batch_size=1024 \
  --infer_batch_size=64 \
  --metrics=BLEU \
  --bucket_width=5 \
  --avg_ckpts=True \
  --label_smoothing=0.1 \
  --src_max_len=70 \
  --tgt_max_len=70 \
  --num_gpus=8