cemsubakan
committed on
Commit
•
25df5de
1
Parent(s):
b665af3
Update hyperparams.yaml
Browse files
- hyperparams.yaml +12 -7
hyperparams.yaml
CHANGED
@@ -22,10 +22,10 @@ n_mels: 80
|
|
22 |
out_n_neurons: 50
|
23 |
|
24 |
# embedding_model: !new:custom_models.Conv2dEncoder_v2
|
25 |
-
embedding_model:
|
26 |
dim: 256
|
27 |
|
28 |
-
classifier:
|
29 |
input_size: 256
|
30 |
out_neurons: 50
|
31 |
lin_blocks: 1
|
@@ -38,25 +38,30 @@ n_fft: 1024
|
|
38 |
spec_mag_power: 0.5
|
39 |
hop_length: 11.6099
|
40 |
win_length: 23.2199
|
41 |
-
compute_stft:
|
42 |
n_fft: 1024
|
43 |
hop_length: 11.6099
|
44 |
win_length: 23.2199
|
45 |
sample_rate: 16000
|
46 |
|
47 |
-
compute_fbank:
|
48 |
n_mels: 80
|
49 |
n_fft: 1024
|
50 |
sample_rate: 16000
|
51 |
|
52 |
-
compute_istft:
|
53 |
sample_rate: 16000
|
54 |
hop_length: 11.6099
|
55 |
win_length: 23.2199
|
56 |
|
57 |
label_encoder: !new:speechbrain.dataio.encoder.CategoricalEncoder
|
58 |
-
psi_model:
|
59 |
-
|
|
|
|
|
|
|
|
|
|
|
60 |
|
61 |
modules:
|
62 |
compute_stft: !ref <compute_stft>
|
|
|
22 |
out_n_neurons: 50
|
23 |
|
24 |
# embedding_model: !new:custom_models.Conv2dEncoder_v2
|
25 |
+
embedding_model: !new:speechbrain.lobes.models.PIQ.Conv2dEncoder_v2
|
26 |
dim: 256
|
27 |
|
28 |
+
classifier: !new:speechbrain.lobes.models.ECAPA_TDNN.Classifier
|
29 |
input_size: 256
|
30 |
out_neurons: 50
|
31 |
lin_blocks: 1
|
|
|
38 |
spec_mag_power: 0.5
|
39 |
hop_length: 11.6099
|
40 |
win_length: 23.2199
|
41 |
+
compute_stft: !new:speechbrain.processing.features.STFT
|
42 |
n_fft: 1024
|
43 |
hop_length: 11.6099
|
44 |
win_length: 23.2199
|
45 |
sample_rate: 16000
|
46 |
|
47 |
+
compute_fbank: !new:speechbrain.processing.features.Filterbank
|
48 |
n_mels: 80
|
49 |
n_fft: 1024
|
50 |
sample_rate: 16000
|
51 |
|
52 |
+
compute_istft: !new:speechbrain.processing.features.ISTFT
|
53 |
sample_rate: 16000
|
54 |
hop_length: 11.6099
|
55 |
win_length: 23.2199
|
56 |
|
57 |
label_encoder: !new:speechbrain.dataio.encoder.CategoricalEncoder
|
58 |
+
psi_model: !new:speechbrain.lobes.models.PIQ.VectorQuantizedPSI_Audio
|
59 |
+
dim: 256
|
60 |
+
K: 1024
|
61 |
+
shared_keys: 0
|
62 |
+
activate_class_partitioning: true
|
63 |
+
use_adapter: true
|
64 |
+
adapter_reduce_dim: true
|
65 |
|
66 |
modules:
|
67 |
compute_stft: !ref <compute_stft>
|