Upload 6 files

Browse files

Files changed (6) hide show

classifier.ckpt +3 -0
config.json +3 -0
embedding_model.ckpt +3 -0
hyperparams.yaml +63 -0
label_encoder.txt +0 -0
mean_var_norm_emb.ckpt +3 -0

classifier.ckpt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5f7ea89eb44b3a3e8e3b957b8a473f9b024c2686e95170963223d2182ff1c076
+size 13207403

config.json ADDED Viewed

	@@ -0,0 +1,3 @@

+{
+  "speechbrain_interface": "EncoderClassifier"
+}

embedding_model.ckpt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:17890d7a013d36d71071599cb0ac720b673b5b16863c8e1ad769c3ce525b57d3
+size 16887086

hyperparams.yaml ADDED Viewed

	@@ -0,0 +1,63 @@

+# ############################################################################
+# Model: xvector for Speaker verification
+# ############################################################################
+# Feature parameters
+n_mels: 24
+# Pretrain folder (HuggingFace)
+pretrained_path: team-lucid/spkrec-xvect-korean
+# Output parameters
+out_n_neurons: 5914
+# Model params
+compute_features: !new:speechbrain.lobes.features.Fbank
+    n_mels: !ref <n_mels>
+mean_var_norm: !new:speechbrain.processing.features.InputNormalization
+    norm_type: sentence
+    std_norm: False
+embedding_model: !new:speechbrain.lobes.models.Xvector.Xvector
+    in_channels: !ref <n_mels>
+    activation: !name:torch.nn.LeakyReLU
+    tdnn_blocks: 5
+    tdnn_channels: [512, 512, 512, 512, 1500]
+    tdnn_kernel_sizes: [5, 3, 3, 1, 1]
+    tdnn_dilations: [1, 2, 3, 1, 1]
+    lin_neurons: 512
+classifier: !new:speechbrain.lobes.models.Xvector.Classifier
+    input_shape: [null, null, 512]
+    activation: !name:torch.nn.LeakyReLU
+    lin_blocks: 1
+    lin_neurons: 512
+    out_neurons: !ref <out_n_neurons>
+mean_var_norm_emb: !new:speechbrain.processing.features.InputNormalization
+    norm_type: global
+    std_norm: False
+modules:
+    compute_features: !ref <compute_features>
+    mean_var_norm: !ref <mean_var_norm>
+    embedding_model: !ref <embedding_model>
+    mean_var_norm_emb: !ref <mean_var_norm_emb>
+    classifier: !ref <classifier>
+label_encoder: !new:speechbrain.dataio.encoder.CategoricalEncoder
+pretrainer: !new:speechbrain.utils.parameter_transfer.Pretrainer
+    loadables:
+        embedding_model: !ref <embedding_model>
+        mean_var_norm_emb: !ref <mean_var_norm_emb>
+        classifier: !ref <classifier>
+        label_encoder: !ref <label_encoder>
+    paths:
+        embedding_model: !ref <pretrained_path>/embedding_model.ckpt
+        mean_var_norm_emb: !ref <pretrained_path>/mean_var_norm_emb.ckpt
+        classifier: !ref <pretrained_path>/classifier.ckpt
+        label_encoder: !ref <pretrained_path>/label_encoder.txt

label_encoder.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

mean_var_norm_emb.ckpt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:26438e2995f675d14eb728a7e794794526db4c4d4c3fa06f7ba48e2e211a3341
+size 1167