Titouan
committed on
Commit
•
893e8fd
1
Parent(s):
d2aff8d
EncoderDecoderASR update
Browse files
- hyperparams.yaml +10 -7
hyperparams.yaml
CHANGED
@@ -139,7 +139,14 @@ lm_model: !new:speechbrain.lobes.models.transformer.TransformerLM.TransformerLM
|
|
139 |
activation: !name:torch.nn.GELU
|
140 |
normalize_before: False
|
141 |
|
142 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
143 |
embedding: !ref <emb>
|
144 |
decoder: !ref <dec>
|
145 |
linear: !ref <seq_lin>
|
@@ -162,13 +169,9 @@ beam_searcher: !new:speechbrain.decoders.S2SRNNBeamSearchTransformerLM
|
|
162 |
temperature_lm: !ref <temperature_lm>
|
163 |
|
164 |
modules:
|
165 |
-
|
166 |
-
|
167 |
-
asr_decoder: !ref <dec>
|
168 |
-
asr_model: !ref <asr_model>
|
169 |
-
normalize: !ref <normalize>
|
170 |
lm_model: !ref <lm_model>
|
171 |
-
beam_searcher: !ref <beam_searcher>
|
172 |
|
173 |
# The pretrainer allows a mapping between pretrained files and instances that
|
174 |
# are declared in the yaml.
|
|
|
139 |
activation: !name:torch.nn.GELU
|
140 |
normalize_before: False
|
141 |
|
142 |
+
# We compose the inference (encoder) pipeline.
|
143 |
+
encoder: !new:speechbrain.nnet.containers.LengthsCapableSequential
|
144 |
+
input_shape: [null, null, !ref <n_mels>]
|
145 |
+
compute_features: !ref <compute_features>
|
146 |
+
normalize: !ref <normalize>
|
147 |
+
model: !ref <enc>
|
148 |
+
|
149 |
+
decoder: !new:speechbrain.decoders.S2SRNNBeamSearchTransformerLM
|
150 |
embedding: !ref <emb>
|
151 |
decoder: !ref <dec>
|
152 |
linear: !ref <seq_lin>
|
|
|
169 |
temperature_lm: !ref <temperature_lm>
|
170 |
|
171 |
modules:
|
172 |
+
encoder: !ref <encoder>
|
173 |
+
decoder: !ref <decoder>
|
|
|
|
|
|
|
174 |
lm_model: !ref <lm_model>
|
|
|
175 |
|
176 |
# The pretrainer allows a mapping between pretrained files and instances that
|
177 |
# are declared in the yaml.
|