Beka-pika
/

mms_kaz_tts

Inference Endpoints

Model card | Files and versions | Community

Beka-pika committed on Nov 7

Commit

1b7c129

•

1 Parent(s): f38c659

Upload model

Files changed (2) hide show

config.json +3 -4
model.safetensors +2 -2

config.json CHANGED Viewed

@@ -1,8 +1,7 @@
 {
-  "_name_or_path": "./tmp/vits_finetuned_angry",
   "activation_dropout": 0.1,
   "architectures": [
-    "VitsModel"
   ],
   "attention_dropout": 0.1,
   "depth_separable_channels": 2,
@@ -52,7 +51,7 @@
   "noise_scale_duration": 0.8,
   "num_attention_heads": 2,
   "num_hidden_layers": 6,
-  "num_speakers": 2,
   "posterior_encoder_num_wavenet_layers": 16,
   "prior_encoder_num_flows": 4,
   "prior_encoder_num_wavenet_layers": 4,
@@ -80,7 +79,7 @@
   ],
   "sampling_rate": 16000,
   "segment_size": 8192,
-  "speaker_embedding_size": 256,
   "speaking_rate": 1.0,
   "spectrogram_bins": 513,
   "torch_dtype": "float32",

 {
   "activation_dropout": 0.1,
   "architectures": [
+    "VitsModelForPreTraining"
   ],
   "attention_dropout": 0.1,
   "depth_separable_channels": 2,
   "noise_scale_duration": 0.8,
   "num_attention_heads": 2,
   "num_hidden_layers": 6,
+  "num_speakers": 1,
   "posterior_encoder_num_wavenet_layers": 16,
   "prior_encoder_num_flows": 4,
   "prior_encoder_num_wavenet_layers": 4,
   ],
   "sampling_rate": 16000,
   "segment_size": 8192,
+  "speaker_embedding_size": 0,
   "speaking_rate": 1.0,
   "spectrogram_bins": 513,
   "torch_dtype": "float32",

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7f562a6266ca53658fa038f2924b726b4fe1f1a0d97bffc8a36943c84d67f773
-size 158643960

 version https://git-lfs.github.com/spec/v1
+oid sha256:288ebc5b047526f9a93b7bbdf32fbaa5cf73cbebdca9d16c1181580c3f273de7
+size 332164552