Update hyperparams.yaml
Browse files- hyperparams.yaml +25 -9
hyperparams.yaml
CHANGED
@@ -146,27 +146,43 @@ encoder: !new:speechbrain.nnet.containers.LengthsCapableSequential
|
|
146 |
normalize: !ref <normalizer>
|
147 |
model: !ref <enc>
|
148 |
|
149 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
150 |
embedding: !ref <emb>
|
151 |
decoder: !ref <dec>
|
152 |
linear: !ref <seq_lin>
|
153 |
-
ctc_linear: !ref <ctc_lin>
|
154 |
-
language_model: !ref <lm_model>
|
155 |
bos_index: !ref <bos_index>
|
156 |
eos_index: !ref <eos_index>
|
157 |
-
blank_index: !ref <blank_index>
|
158 |
min_decode_ratio: !ref <min_decode_ratio>
|
159 |
max_decode_ratio: !ref <max_decode_ratio>
|
160 |
beam_size: !ref <beam_size>
|
161 |
eos_threshold: !ref <eos_threshold>
|
162 |
using_max_attn_shift: !ref <using_max_attn_shift>
|
163 |
max_attn_shift: !ref <max_attn_shift>
|
164 |
-
coverage_penalty: !ref <coverage_penalty>
|
165 |
-
lm_weight: !ref <lm_weight>
|
166 |
-
ctc_weight: !ref <ctc_weight_decode>
|
167 |
-
ctc_window_size: !ref <ctc_window_size>
|
168 |
temperature: !ref <temperature>
|
169 |
-
|
170 |
|
171 |
modules:
|
172 |
normalizer: !ref <normalizer>
|
|
|
146 |
normalize: !ref <normalizer>
|
147 |
model: !ref <enc>
|
148 |
|
149 |
+
# Scorer
|
150 |
+
ctc_scorer: !new:speechbrain.decoders.scorer.CTCScorer
|
151 |
+
eos_index: !ref <eos_index>
|
152 |
+
blank_index: !ref <blank_index>
|
153 |
+
ctc_fc: !ref <ctc_lin>
|
154 |
+
ctc_window_size: !ref <ctc_window_size>
|
155 |
+
|
156 |
+
transformerlm_scorer: !new:speechbrain.decoders.scorer.TransformerLMScorer
|
157 |
+
language_model: !ref <lm_model>
|
158 |
+
temperature: !ref <temperature_lm>
|
159 |
+
|
160 |
+
coverage_scorer: !new:speechbrain.decoders.scorer.CoverageScorer
|
161 |
+
vocab_size: !ref <output_neurons>
|
162 |
+
|
163 |
+
scorer: !new:speechbrain.decoders.scorer.ScorerBuilder
|
164 |
+
full_scorers: [!ref <transformerlm_scorer>,
|
165 |
+
!ref <coverage_scorer>,
|
166 |
+
!ref <ctc_scorer>]
|
167 |
+
weights:
|
168 |
+
transformerlm: !ref <lm_weight>
|
169 |
+
coverage: !ref <coverage_penalty>
|
170 |
+
ctc: !ref <ctc_weight_decode>
|
171 |
+
|
172 |
+
decoder: !new:speechbrain.decoders.S2SRNNBeamSearcher
|
173 |
embedding: !ref <emb>
|
174 |
decoder: !ref <dec>
|
175 |
linear: !ref <seq_lin>
|
|
|
|
|
176 |
bos_index: !ref <bos_index>
|
177 |
eos_index: !ref <eos_index>
|
|
|
178 |
min_decode_ratio: !ref <min_decode_ratio>
|
179 |
max_decode_ratio: !ref <max_decode_ratio>
|
180 |
beam_size: !ref <beam_size>
|
181 |
eos_threshold: !ref <eos_threshold>
|
182 |
using_max_attn_shift: !ref <using_max_attn_shift>
|
183 |
max_attn_shift: !ref <max_attn_shift>
|
|
|
|
|
|
|
|
|
184 |
temperature: !ref <temperature>
|
185 |
+
scorer: !ref <scorer>
|
186 |
|
187 |
modules:
|
188 |
normalizer: !ref <normalizer>
|