# Training configuration: arch s2t_transformer_s with the
# label_smoothed_cross_entropy_with_ctc criterion.
# All keys use kebab-case; keep new keys consistent with that.

# Data subsets
train-subset: train_asr
valid-subset: dev_asr

# Training length limits
max-epoch: 50
max-update: 100000

# Runtime, logging and seeding
num-workers: 8
patience: 10
no-progress-bar: True
log-interval: 100
seed: 1
report-accuracy: True

# Pretrained-component keys, currently disabled (no value set)
#load-pretrained-encoder-from:
#load-pretrained-decoder-from:

# Architecture, optimizer and learning-rate schedule
arch: s2t_transformer_s
share-decoder-input-output-embed: True
optimizer: adam
clip-norm: 10.0
lr-scheduler: inverse_sqrt
# NOTE(review): exponent literals without a decimal point (1e-7, 2e-3) load
# as strings, not floats, under YAML 1.1 parsers such as PyYAML -- confirm
# the consumer converts them before changing their spelling.
warmup-init-lr: 1e-7
warmup-updates: 10000
lr: 2e-3
#adam_betas: (0.9,0.98)

# Criterion settings
ctc-weight: 0.3
criterion: label_smoothed_cross_entropy_with_ctc
label-smoothing: 0.1

# Model shape and regularization
conv-kernel-sizes: 5,5
conv-channels: 1024
dropout: 0.1
activation-fn: relu
encoder-embed-dim: 256
encoder-ffn-embed-dim: 2048
encoder-layers: 12
decoder-layers: 6
encoder-attention-heads: 4