-
Notifications
You must be signed in to change notification settings - Fork 75
/
train.simul-s2st.sh
executable file
·34 lines (32 loc) · 1.61 KB
/
train.simul-s2st.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
export CUDA_VISIBLE_DEVICES=0,1,2,3
LANG=fr
DATA_ROOT=/data/zhangshaolei/datasets/cvss/cvss-c
DATA=$DATA_ROOT/${LANG}-en/fbank2unit
model=streamspeech.simul-s2st.${LANG}-en
fairseq-train $DATA \
--user-dir researches/ctc_unity \
--config-yaml config_gcmvn.yaml --multitask-config-yaml config_mtl_asr_st_ctcst.yaml \
--task speech_to_speech_ctc --target-is-code --target-code-size 1000 --vocoder code_hifigan \
--criterion speech_to_unit_2pass_ctc_asr_st --label-smoothing 0.1 --rdrop-alpha 0.0 \
--arch streamspeech --share-decoder-input-output-embed \
--encoder-layers 12 --encoder-embed-dim 256 --encoder-ffn-embed-dim 2048 --encoder-attention-heads 4 \
--translation-decoder-layers 4 --synthesizer-encoder-layers 2 \
--decoder-layers 2 --decoder-embed-dim 512 --decoder-ffn-embed-dim 2048 --decoder-attention-heads 8 \
--k1 0 --k2 0 --n1 1 --n2 -1 \
--chunk-size 8 --multichunk \
--uni-encoder \
--dropout 0.1 --attention-dropout 0.1 --relu-dropout 0.1 \
--train-subset train --valid-subset dev \
--ctc-upsample-rate 25 \
--save-dir checkpoints/$model \
--validate-interval 1000 --validate-interval-updates 1000 \
--save-interval 1 --save-interval-updates 1000 \
--keep-last-epochs 15 \
--no-progress-bar --log-format json --log-interval 100 \
--lr 0.001 --lr-scheduler inverse_sqrt --warmup-init-lr 1e-7 --warmup-updates 10000 \
--optimizer adam --adam-betas "(0.9,0.98)" --clip-norm 1.0 \
--max-tokens 22000 --max-target-positions 1200 --update-freq 2 \
--attn-type espnet --pos-enc-type rel_pos \
--keep-interval-updates 40 \
--keep-best-checkpoints 20 \
--seed 1 --fp16 --num-workers 8