EncoderDecoderASR update
Browse files
- hyperparams.yaml +10 -7
hyperparams.yaml
CHANGED
|
@@ -139,7 +139,14 @@ lm_model: !new:speechbrain.lobes.models.transformer.TransformerLM.TransformerLM
|
|
| 139 |
activation: !name:torch.nn.GELU
|
| 140 |
normalize_before: False
|
| 141 |
|
| 142 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 143 |
embedding: !ref <emb>
|
| 144 |
decoder: !ref <dec>
|
| 145 |
linear: !ref <seq_lin>
|
|
@@ -162,13 +169,9 @@ beam_searcher: !new:speechbrain.decoders.S2SRNNBeamSearchTransformerLM
|
|
| 162 |
temperature_lm: !ref <temperature_lm>
|
| 163 |
|
| 164 |
modules:
|
| 165 |
-
|
| 166 |
-
|
| 167 |
-
asr_decoder: !ref <dec>
|
| 168 |
-
asr_model: !ref <asr_model>
|
| 169 |
-
normalize: !ref <normalize>
|
| 170 |
lm_model: !ref <lm_model>
|
| 171 |
-
beam_searcher: !ref <beam_searcher>
|
| 172 |
|
| 173 |
# The pretrainer allows a mapping between pretrained files and instances that
|
| 174 |
# are declared in the yaml.
|
|
|
|
| 139 |
activation: !name:torch.nn.GELU
|
| 140 |
normalize_before: False
|
| 141 |
|
| 142 |
+
# We compose the inference (encoder) pipeline.
|
| 143 |
+
encoder: !new:speechbrain.nnet.containers.LengthsCapableSequential
|
| 144 |
+
input_shape: [null, null, !ref <n_mels>]
|
| 145 |
+
compute_features: !ref <compute_features>
|
| 146 |
+
normalize: !ref <normalize>
|
| 147 |
+
model: !ref <enc>
|
| 148 |
+
|
| 149 |
+
decoder: !new:speechbrain.decoders.S2SRNNBeamSearchTransformerLM
|
| 150 |
embedding: !ref <emb>
|
| 151 |
decoder: !ref <dec>
|
| 152 |
linear: !ref <seq_lin>
|
|
|
|
| 169 |
temperature_lm: !ref <temperature_lm>
|
| 170 |
|
| 171 |
modules:
|
| 172 |
+
encoder: !ref <encoder>
|
| 173 |
+
decoder: !ref <decoder>
|
|
|
|
|
|
|
|
|
|
| 174 |
lm_model: !ref <lm_model>
|
|
|
|
| 175 |
|
| 176 |
# The pretrainer allows a mapping between pretrained files and instances that
|
| 177 |
# are declared in the yaml.
|