mygo

Browse files

Files changed (17) hide show

Anon_v2/config.json +79 -0
README.md +94 -0
README_zh_CN.md +90 -0
Rana_v2/config.json +79 -0
Soyo0_v2/config.json +79 -0
Soyo1_v2/config.json +79 -0
Taki_v2/config.json +79 -0
Tomori_v2/config.json +79 -0
png/tanon1.png +0 -0
png/thina1.png +0 -0
png/tlisa1.png +0 -0
png/trana1.png +0 -0
png/tsayo1.png +0 -0
png/tsoyo1.png +0 -0
png/ttaki1.png +0 -0
png/ttomori1.png +0 -0
png/tyukina1.png +0 -0

Anon_v2/config.json ADDED Viewed

	@@ -0,0 +1,79 @@

+{
+    "data": {
+        "filter_length": 2048,
+        "hop_length": 400,
+        "max_wav_value": 32768.0,
+        "mel_fmax": null,
+        "mel_fmin": 0.0,
+        "n_mel_channels": 125,
+        "sampling_rate": 40000,
+        "win_length": 2048
+    },
+    "model": {
+        "filter_channels": 768,
+        "gin_channels": 256,
+        "hidden_channels": 192,
+        "inter_channels": 192,
+        "kernel_size": 3,
+        "n_heads": 2,
+        "n_layers": 6,
+        "p_dropout": 0,
+        "resblock": "1",
+        "resblock_dilation_sizes": [
+            [
+                1,
+                3,
+                5
+            ],
+            [
+                1,
+                3,
+                5
+            ],
+            [
+                1,
+                3,
+                5
+            ]
+        ],
+        "resblock_kernel_sizes": [
+            3,
+            7,
+            11
+        ],
+        "spk_embed_dim": 109,
+        "upsample_initial_channel": 512,
+        "upsample_kernel_sizes": [
+            16,
+            16,
+            4,
+            4
+        ],
+        "upsample_rates": [
+            10,
+            10,
+            2,
+            2
+        ],
+        "use_spectral_norm": false
+    },
+    "train": {
+        "batch_size": 4,
+        "betas": [
+            0.8,
+            0.99
+        ],
+        "c_kl": 1.0,
+        "c_mel": 45,
+        "epochs": 20000,
+        "eps": 1e-09,
+        "fp16_run": true,
+        "init_lr_ratio": 1,
+        "learning_rate": 0.0001,
+        "log_interval": 200,
+        "lr_decay": 0.999875,
+        "seed": 1234,
+        "segment_size": 12800,
+        "warmup_epochs": 0
+    }
+}

README.md ADDED Viewed

	@@ -0,0 +1,94 @@

+---
+pipeline_tag: audio-to-audio
+tags:
+- RVC
+---
+# Voice Conversion Models for *BanG Dream!*
+&emsp;
+[**English**](./README.md) | [**中文简体**](./README_zh_CN.md)
+---
+Using RVC (Retrieval-based-Voice-Conversion-WebUI)
+[**RVC**](https://github.com/RVC-Project/Retrieval-based-Voice-Conversion-WebUI)
+&emsp;
+RVC models for *BanG Dream!* characters, trained on voice data from Bestdori.
+These models are intended for learning and communication purposes only. Using them for illegal activities is strictly prohibited.
+&emsp;
+Models whose names end in `_v2` are RVC v2 models; all others are v1 models.
+(The v2 model changes the input from the 256-dimensional feature of 9-layer HuBERT + final_proj to the 768-dimensional feature of 12-layer HuBERT, and adds 3 period discriminators.)
+---
+## Character list
+### Poppin'Party
+### Afterglow
+### Hello, Happy World！
+### Pastel＊Palettes
+![hina](png/thina1.png)
+冰川 日菜
+Hina Hikawa
+### Roselia
+![sayo](png/tsayo1.png)
+冰川 纱夜
+Sayo Hikawa
+![yukina](png/tyukina1.png)
+凑 友希那
+Yukina Minato
+![lisa](png/tlisa1.png)
+今井 莉莎
+Lisa Imai
+### RAISE A SUILEN
+### Morfonica
+### MyGO!!!!!
+![anon](png/tanon1.png)
+千早 爱音
+Anon Chihaya
+![soyo](png/tsoyo1.png)
+长崎 爽世
+Soyo Nagasaki
+![tomori](png/ttomori1.png)
+高松 灯
+Tomori Takamatsu
+![taki](png/ttaki1.png)
+椎名 立希
+Taki Shiina
+![rana](png/trana1.png)
+要 乐奈
+Rana Kaname
+### Ave Mujica
+---
+## Links
+[**RVC(github)**](https://github.com/RVC-Project/Retrieval-based-Voice-Conversion-WebUI)
+[**RVC(huggingface)**](https://huggingface.co/lj1995/VoiceConversionWebUI/tree/main)
+[**tutorial video for RVC**](https://www.bilibili.com/video/BV1pm4y1z7Gm)

README_zh_CN.md ADDED Viewed

	@@ -0,0 +1,90 @@

+# BanG Dream!角色语音转换模型
+&emsp;
+[**English**](./README.md) | [**中文简体**](./README_zh_CN.md)
+---
+使用 RVC (Retrieval-based-Voice-Conversion-WebUI)
+[**RVC**](https://github.com/RVC-Project/Retrieval-based-Voice-Conversion-WebUI)
+&emsp;
+BanG Dream!角色RVC模型，以bestdori上的语音数据训练而成。
+仅供学习交流试用，不可用于非法用途。
+具体使用方法见：https://github.com/RVC-Project/Retrieval-based-Voice-Conversion-WebUI/blob/main/README.md
+&emsp;
+带v2标识的模型为v2模型，无标识的模型皆为v1模型。
+(v2版本模型将特征从 9层hubert+final_proj的256维输入 变更为 12层hubert的768维输入，并且增加了3个周期鉴别器)
+---
+## 角色列表
+### Poppin'Party
+### Afterglow
+### Hello, Happy World！
+### Pastel＊Palettes
+![hina](png/thina1.png)
+冰川 日菜
+Hina Hikawa
+### Roselia
+![sayo](png/tsayo1.png)
+冰川 纱夜
+Sayo Hikawa
+![yukina](png/tyukina1.png)
+凑 友希那
+Yukina Minato
+![lisa](png/tlisa1.png)
+今井 莉莎
+Lisa Imai
+### RAISE A SUILEN
+### Morfonica
+### MyGO!!!!!
+![anon](png/tanon1.png)
+千早 爱音
+Anon Chihaya
+![soyo](png/tsoyo1.png)
+长崎 爽世
+Soyo Nagasaki
+![tomori](png/ttomori1.png)
+高松 灯
+Tomori Takamatsu
+![taki](png/ttaki1.png)
+椎名 立希
+Taki Shiina
+![rana](png/trana1.png)
+要 乐奈
+Rana Kaname
+### Ave Mujica
+---
+## 相关链接
+[**RVC(github)**](https://github.com/RVC-Project/Retrieval-based-Voice-Conversion-WebUI)
+[**RVC(huggingface)**](https://huggingface.co/lj1995/VoiceConversionWebUI/tree/main)
+[**RVC视频教程**](https://www.bilibili.com/video/BV1pm4y1z7Gm)

Rana_v2/config.json ADDED Viewed

	@@ -0,0 +1,79 @@

+{
+    "data": {
+        "filter_length": 2048,
+        "hop_length": 400,
+        "max_wav_value": 32768.0,
+        "mel_fmax": null,
+        "mel_fmin": 0.0,
+        "n_mel_channels": 125,
+        "sampling_rate": 40000,
+        "win_length": 2048
+    },
+    "model": {
+        "filter_channels": 768,
+        "gin_channels": 256,
+        "hidden_channels": 192,
+        "inter_channels": 192,
+        "kernel_size": 3,
+        "n_heads": 2,
+        "n_layers": 6,
+        "p_dropout": 0,
+        "resblock": "1",
+        "resblock_dilation_sizes": [
+            [
+                1,
+                3,
+                5
+            ],
+            [
+                1,
+                3,
+                5
+            ],
+            [
+                1,
+                3,
+                5
+            ]
+        ],
+        "resblock_kernel_sizes": [
+            3,
+            7,
+            11
+        ],
+        "spk_embed_dim": 109,
+        "upsample_initial_channel": 512,
+        "upsample_kernel_sizes": [
+            16,
+            16,
+            4,
+            4
+        ],
+        "upsample_rates": [
+            10,
+            10,
+            2,
+            2
+        ],
+        "use_spectral_norm": false
+    },
+    "train": {
+        "batch_size": 4,
+        "betas": [
+            0.8,
+            0.99
+        ],
+        "c_kl": 1.0,
+        "c_mel": 45,
+        "epochs": 20000,
+        "eps": 1e-09,
+        "fp16_run": true,
+        "init_lr_ratio": 1,
+        "learning_rate": 0.0001,
+        "log_interval": 200,
+        "lr_decay": 0.999875,
+        "seed": 1234,
+        "segment_size": 12800,
+        "warmup_epochs": 0
+    }
+}

Soyo0_v2/config.json ADDED Viewed

	@@ -0,0 +1,79 @@

+{
+    "data": {
+        "filter_length": 2048,
+        "hop_length": 400,
+        "max_wav_value": 32768.0,
+        "mel_fmax": null,
+        "mel_fmin": 0.0,
+        "n_mel_channels": 125,
+        "sampling_rate": 40000,
+        "win_length": 2048
+    },
+    "model": {
+        "filter_channels": 768,
+        "gin_channels": 256,
+        "hidden_channels": 192,
+        "inter_channels": 192,
+        "kernel_size": 3,
+        "n_heads": 2,
+        "n_layers": 6,
+        "p_dropout": 0,
+        "resblock": "1",
+        "resblock_dilation_sizes": [
+            [
+                1,
+                3,
+                5
+            ],
+            [
+                1,
+                3,
+                5
+            ],
+            [
+                1,
+                3,
+                5
+            ]
+        ],
+        "resblock_kernel_sizes": [
+            3,
+            7,
+            11
+        ],
+        "spk_embed_dim": 109,
+        "upsample_initial_channel": 512,
+        "upsample_kernel_sizes": [
+            16,
+            16,
+            4,
+            4
+        ],
+        "upsample_rates": [
+            10,
+            10,
+            2,
+            2
+        ],
+        "use_spectral_norm": false
+    },
+    "train": {
+        "batch_size": 4,
+        "betas": [
+            0.8,
+            0.99
+        ],
+        "c_kl": 1.0,
+        "c_mel": 45,
+        "epochs": 20000,
+        "eps": 1e-09,
+        "fp16_run": true,
+        "init_lr_ratio": 1,
+        "learning_rate": 0.0001,
+        "log_interval": 200,
+        "lr_decay": 0.999875,
+        "seed": 1234,
+        "segment_size": 12800,
+        "warmup_epochs": 0
+    }
+}

Soyo1_v2/config.json ADDED Viewed

	@@ -0,0 +1,79 @@

+{
+    "data": {
+        "filter_length": 2048,
+        "hop_length": 400,
+        "max_wav_value": 32768.0,
+        "mel_fmax": null,
+        "mel_fmin": 0.0,
+        "n_mel_channels": 125,
+        "sampling_rate": 40000,
+        "win_length": 2048
+    },
+    "model": {
+        "filter_channels": 768,
+        "gin_channels": 256,
+        "hidden_channels": 192,
+        "inter_channels": 192,
+        "kernel_size": 3,
+        "n_heads": 2,
+        "n_layers": 6,
+        "p_dropout": 0,
+        "resblock": "1",
+        "resblock_dilation_sizes": [
+            [
+                1,
+                3,
+                5
+            ],
+            [
+                1,
+                3,
+                5
+            ],
+            [
+                1,
+                3,
+                5
+            ]
+        ],
+        "resblock_kernel_sizes": [
+            3,
+            7,
+            11
+        ],
+        "spk_embed_dim": 109,
+        "upsample_initial_channel": 512,
+        "upsample_kernel_sizes": [
+            16,
+            16,
+            4,
+            4
+        ],
+        "upsample_rates": [
+            10,
+            10,
+            2,
+            2
+        ],
+        "use_spectral_norm": false
+    },
+    "train": {
+        "batch_size": 4,
+        "betas": [
+            0.8,
+            0.99
+        ],
+        "c_kl": 1.0,
+        "c_mel": 45,
+        "epochs": 20000,
+        "eps": 1e-09,
+        "fp16_run": true,
+        "init_lr_ratio": 1,
+        "learning_rate": 0.0001,
+        "log_interval": 200,
+        "lr_decay": 0.999875,
+        "seed": 1234,
+        "segment_size": 12800,
+        "warmup_epochs": 0
+    }
+}

Taki_v2/config.json ADDED Viewed

	@@ -0,0 +1,79 @@

+{
+    "data": {
+        "filter_length": 2048,
+        "hop_length": 400,
+        "max_wav_value": 32768.0,
+        "mel_fmax": null,
+        "mel_fmin": 0.0,
+        "n_mel_channels": 125,
+        "sampling_rate": 40000,
+        "win_length": 2048
+    },
+    "model": {
+        "filter_channels": 768,
+        "gin_channels": 256,
+        "hidden_channels": 192,
+        "inter_channels": 192,
+        "kernel_size": 3,
+        "n_heads": 2,
+        "n_layers": 6,
+        "p_dropout": 0,
+        "resblock": "1",
+        "resblock_dilation_sizes": [
+            [
+                1,
+                3,
+                5
+            ],
+            [
+                1,
+                3,
+                5
+            ],
+            [
+                1,
+                3,
+                5
+            ]
+        ],
+        "resblock_kernel_sizes": [
+            3,
+            7,
+            11
+        ],
+        "spk_embed_dim": 109,
+        "upsample_initial_channel": 512,
+        "upsample_kernel_sizes": [
+            16,
+            16,
+            4,
+            4
+        ],
+        "upsample_rates": [
+            10,
+            10,
+            2,
+            2
+        ],
+        "use_spectral_norm": false
+    },
+    "train": {
+        "batch_size": 4,
+        "betas": [
+            0.8,
+            0.99
+        ],
+        "c_kl": 1.0,
+        "c_mel": 45,
+        "epochs": 20000,
+        "eps": 1e-09,
+        "fp16_run": true,
+        "init_lr_ratio": 1,
+        "learning_rate": 0.0001,
+        "log_interval": 200,
+        "lr_decay": 0.999875,
+        "seed": 1234,
+        "segment_size": 12800,
+        "warmup_epochs": 0
+    }
+}

Tomori_v2/config.json ADDED Viewed

	@@ -0,0 +1,79 @@

+{
+    "data": {
+        "filter_length": 2048,
+        "hop_length": 400,
+        "max_wav_value": 32768.0,
+        "mel_fmax": null,
+        "mel_fmin": 0.0,
+        "n_mel_channels": 125,
+        "sampling_rate": 40000,
+        "win_length": 2048
+    },
+    "model": {
+        "filter_channels": 768,
+        "gin_channels": 256,
+        "hidden_channels": 192,
+        "inter_channels": 192,
+        "kernel_size": 3,
+        "n_heads": 2,
+        "n_layers": 6,
+        "p_dropout": 0,
+        "resblock": "1",
+        "resblock_dilation_sizes": [
+            [
+                1,
+                3,
+                5
+            ],
+            [
+                1,
+                3,
+                5
+            ],
+            [
+                1,
+                3,
+                5
+            ]
+        ],
+        "resblock_kernel_sizes": [
+            3,
+            7,
+            11
+        ],
+        "spk_embed_dim": 109,
+        "upsample_initial_channel": 512,
+        "upsample_kernel_sizes": [
+            16,
+            16,
+            4,
+            4
+        ],
+        "upsample_rates": [
+            10,
+            10,
+            2,
+            2
+        ],
+        "use_spectral_norm": false
+    },
+    "train": {
+        "batch_size": 4,
+        "betas": [
+            0.8,
+            0.99
+        ],
+        "c_kl": 1.0,
+        "c_mel": 45,
+        "epochs": 20000,
+        "eps": 1e-09,
+        "fp16_run": true,
+        "init_lr_ratio": 1,
+        "learning_rate": 0.0001,
+        "log_interval": 200,
+        "lr_decay": 0.999875,
+        "seed": 1234,
+        "segment_size": 12800,
+        "warmup_epochs": 0
+    }
+}

png/tanon1.png ADDED Viewed

png/thina1.png ADDED Viewed

png/tlisa1.png ADDED Viewed

png/trana1.png ADDED Viewed

png/tsayo1.png ADDED Viewed

png/tsoyo1.png ADDED Viewed

png/ttaki1.png ADDED Viewed

png/ttomori1.png ADDED Viewed

png/tyukina1.png ADDED Viewed