# sate_big_pds.yaml
# Configuration selecting the `s2t_sate` architecture with a `pds` acoustic
# encoder. Keys and values are kept exactly as the consumer expects them;
# only comments have been added.

# Model selection and optimizer / learning-rate schedule.
arch: s2t_sate
share-decoder-input-output-embed: True
optimizer: adam
clip-norm: 10.0
lr-scheduler: inverse_sqrt
# NOTE(review): YAML 1.1 loaders (e.g. PyYAML) resolve exponent literals
# without a decimal point, such as 1e-7 and 1e-3, as strings rather than
# floats -- confirm the consumer converts them before numeric use.
warmup-init-lr: 1e-7
warmup-updates: 10000
lr: 1e-3
# Plain scalar: the parentheses and comma are passed through as a string.
adam_betas: (0.9,0.98)

# Training criterion.
criterion: label_smoothed_cross_entropy_with_ctc
label_smoothing: 0.1

# Encoder / decoder normalize-before flags, followed by the subsampling
# front-end settings.
encoder-normalize-before: True
decoder-normalize-before: True
subsampling-type: conv1d
subsampling-layers: 2
subsampling-filter: 2048
subsampling-kernel: 5
subsampling-stride: 2
subsampling-norm: none
subsampling-activation: glu

# Regularization, activation, and encoder / decoder depth.
dropout: 0.15
activation-fn: relu
encoder-ffn-embed-dim: 2048
encoder-layers: 12
text-encoder-layers: 6
decoder-layers: 6
encoder-attention-heads: 8

# Decoder dimensions.
decoder-embed-dim: 512
decoder-ffn-embed-dim: 2048
decoder-attention-heads: 8

# Acoustic encoder type and adapter.
acoustic-encoder: pds
adapter: league

# PDS encoder settings. Each underscore-separated value below has four
# fields, matching `pds-stages: 4` -- presumably one field per stage; confirm
# against the consumer before changing the stage count.
encoder-embed-dim: 512
ctc-layer: 12
pds-stages: 4
pds-layers: 3_3_3_3
pds-ratios: 2_2_1_2
pds-fusion: True
pds-fusion-method: all_conv
pds-embed-dims: 512_512_512_512
pds-ds-method: conv
pds-embed-norm: True
pds-position-embed: 1_1_1_1
pds-kernel-sizes: 5_5_5_5
pds-ffn-ratios: 4_4_4_4
pds-attn-heads: 8_8_8_8

# Pretrained-component loading is left disabled: the keys below are commented
# out and carry no value. Presumably each takes a checkpoint path -- confirm
# before enabling.
#load-pretrained-encoder-from:
#load-pretrained-acoustic-encoder-from:
#load-pretrained-text-encoder-from:
#load-pretrained-decoder-from: