speechbrain
/

asr-crdnn-transformerlm-librispeech

Automatic Speech Recognition

Model card Files Files and versions Community

Adel-Moumen committed on Feb 19, 2024

Commit

21f99db

·

verified ·

1 Parent(s): 62d3aed

Update hyperparams.yaml

Files changed (1) hide show

hyperparams.yaml +25 -9

hyperparams.yaml CHANGED Viewed

@@ -146,27 +146,43 @@ encoder: !new:speechbrain.nnet.containers.LengthsCapableSequential
     normalize: !ref <normalizer>
     model: !ref <enc>
-decoder: !new:speechbrain.decoders.S2SRNNBeamSearchTransformerLM  # old definition removed by this commit; the replacement uses S2SRNNBeamSearcher plus a separate scorer
    embedding: !ref <emb>
    decoder: !ref <dec>
    linear: !ref <seq_lin>
-   ctc_linear: !ref <ctc_lin>
-   language_model: !ref <lm_model>
    bos_index: !ref <bos_index>
    eos_index: !ref <eos_index>
-   blank_index: !ref <blank_index>
    min_decode_ratio: !ref <min_decode_ratio>
    max_decode_ratio: !ref <max_decode_ratio>
    beam_size: !ref <beam_size>
    eos_threshold: !ref <eos_threshold>
    using_max_attn_shift: !ref <using_max_attn_shift>
    max_attn_shift: !ref <max_attn_shift>
-   coverage_penalty: !ref <coverage_penalty>
-   lm_weight: !ref <lm_weight>
-   ctc_weight: !ref <ctc_weight_decode>
-   ctc_window_size: !ref <ctc_window_size>
    temperature: !ref <temperature>
-   temperature_lm: !ref <temperature_lm>
 modules:
    normalizer: !ref <normalizer>

     normalize: !ref <normalizer>
     model: !ref <enc>
+# Scorers: built individually, then combined by ScorerBuilder and passed to the decoder
+ctc_scorer: !new:speechbrain.decoders.scorer.CTCScorer  # CTC scorer; listed in <scorer>'s full_scorers
+    eos_index: !ref <eos_index>
+    blank_index: !ref <blank_index>
+    ctc_fc: !ref <ctc_lin>  # same <ctc_lin> the old decoder received as ctc_linear
+    ctc_window_size: !ref <ctc_window_size>
+transformerlm_scorer: !new:speechbrain.decoders.scorer.TransformerLMScorer  # LM scorer around <lm_model>
+   language_model: !ref <lm_model>
+   temperature: !ref <temperature_lm>  # LM temperature; distinct from the decoder's <temperature>
+coverage_scorer: !new:speechbrain.decoders.scorer.CoverageScorer  # weighted by <coverage_penalty> in <scorer>
+   vocab_size: !ref <output_neurons>
+# Combines the LM, coverage and CTC scorers into the single object handed to
+# the beam searcher. Keys under `weights` are the short scorer names that
+# ScorerBuilder recognizes (`transformerlm`, `coverage`, `ctc`), not the YAML
+# variable names of the scorer objects.
+scorer: !new:speechbrain.decoders.scorer.ScorerBuilder
+   full_scorers: [!ref <transformerlm_scorer>,
+                  !ref <coverage_scorer>,
+                  !ref <ctc_scorer>]
+   weights:
+      transformerlm: !ref <lm_weight>
+      coverage: !ref <coverage_penalty>
+      ctc: !ref <ctc_weight_decode>
+decoder: !new:speechbrain.decoders.S2SRNNBeamSearcher  # replaces S2SRNNBeamSearchTransformerLM
    embedding: !ref <emb>
    decoder: !ref <dec>
    linear: !ref <seq_lin>
    bos_index: !ref <bos_index>
    eos_index: !ref <eos_index>
    min_decode_ratio: !ref <min_decode_ratio>
    max_decode_ratio: !ref <max_decode_ratio>
    beam_size: !ref <beam_size>
    eos_threshold: !ref <eos_threshold>
    using_max_attn_shift: !ref <using_max_attn_shift>
    max_attn_shift: !ref <max_attn_shift>
    temperature: !ref <temperature>
+   scorer: !ref <scorer>  # CTC, LM and coverage settings now arrive through the ScorerBuilder object
 modules:
    normalizer: !ref <normalizer>