# jasper_smaller.yaml (repository forked from NVIDIA/NeMo)
---
# Model identifier and audio sample rate (presumably in Hz; confirm with the
# consuming script).
model: 'Jasper'
sample_rate: 16000
# Data layer options, given separately for the `train` and `eval` splits:
# shuffling is enabled for training and disabled for evaluation.
AudioToTextDataLayer:
  train:
    shuffle: true
  eval:
    shuffle: false
# Audio feature-extraction options.
# NOTE(review): window_size / window_stride are presumably in seconds
# (0.02 / 0.01); confirm against the preprocessor that reads this section.
AudioPreprocessing:
  normalize: "per_feature"
  window_size: 0.02
  window_stride: 0.01
  window: "hann"
  features: 64
  n_fft: 512
  frame_splicing: 1
  dither: 0.00001
  feat_type: "logfbank"
  stft_conv: true
# Encoder definition: one activation setting plus a `jasper` list of five
# block specifications. Every block carries the same seven keys; filter
# counts grow from 256 to 1024, only the first block uses stride 2, and the
# first and last blocks have `residual: false`.
JasperEncoder:
  activation: "relu"
  jasper:
    - filters: 256
      repeat: 1
      kernel: [11]
      stride: [2]
      dilation: [1]
      dropout: 0.0
      residual: false

    - filters: 256
      repeat: 3
      kernel: [11]
      stride: [1]
      dilation: [1]
      dropout: 0.1
      residual: true

    - filters: 512
      repeat: 2
      kernel: [17]
      stride: [1]
      dilation: [1]
      dropout: 0.1
      residual: true

    - filters: 768
      repeat: 1
      kernel: [25]
      stride: [1]
      dilation: [1]
      dropout: 0.1
      residual: true

    - filters: 1024
      repeat: 1
      kernel: [1]
      stride: [1]
      dilation: [1]
      dropout: 0.2
      residual: false
# Decoder options: a 2-layer LSTM with attention settings, three dropout
# rates, teacher forcing / curriculum learning values, and tied
# embedding/output weights.
DecoderRNN:
  hidden_size: 128
  attention_method: "general"
  attention_type: "post"
  in_dropout: 0.2
  rnn_dropout: 0.2
  attn_dropout: 0.2
  teacher_forcing: 0.6
  curriculum_learning: 0.75
  rnn_type: "lstm"
  n_layers: 2
  tie_emb_out_weights: true
  # NOTE(review): `load` and `freeze` directly follow the decoder options, so
  # they are nested here; confirm the consuming script does not expect them
  # as top-level keys.
  load: false
  freeze: false
# Label set: 28 symbols (space, the lowercase letters a-z, and apostrophe).
# The continuation line is indented so the flow sequence stays valid inside
# the top-level block mapping.
labels: [" ", "a", "b", "c", "d", "e", "f", "g", "h", "i", "j", "k", "l", "m",
         "n", "o", "p", "q", "r", "s", "t", "u", "v", "w", "x", "y", "z", "'"]