Kit-Lemonfoot committed on
Commit
d12a1c3
1 Parent(s): 9b6e37e

Delete old model_assets

Browse files
model_assets/jvnv-F1/config.json DELETED
@@ -1,79 +0,0 @@
1
- {
2
- "model_name": "jvnv-F1",
3
- "train": {
4
- "log_interval": 200,
5
- "eval_interval": 1000,
6
- "seed": 42,
7
- "epochs": 500,
8
- "learning_rate": 0.0002,
9
- "betas": [0.8, 0.99],
10
- "eps": 1e-9,
11
- "batch_size": 4,
12
- "bf16_run": true,
13
- "lr_decay": 0.99995,
14
- "segment_size": 16384,
15
- "init_lr_ratio": 1,
16
- "warmup_epochs": 0,
17
- "c_mel": 45,
18
- "c_kl": 1.0,
19
- "skip_optimizer": false,
20
- "freeze_ZH_bert": false,
21
- "freeze_JP_bert": false,
22
- "freeze_EN_bert": false
23
- },
24
- "data": {
25
- "training_files": "Data/jvnv-F1/train.list",
26
- "validation_files": "Data/jvnv-F1/val.list",
27
- "max_wav_value": 32768.0,
28
- "sampling_rate": 44100,
29
- "filter_length": 2048,
30
- "hop_length": 512,
31
- "win_length": 2048,
32
- "n_mel_channels": 128,
33
- "mel_fmin": 0.0,
34
- "mel_fmax": null,
35
- "add_blank": true,
36
- "n_speakers": 1,
37
- "cleaned_text": true,
38
- "num_styles": 7,
39
- "style2id": {
40
- "Neutral": 0,
41
- "Angry": 1,
42
- "Disgust": 2,
43
- "Fear": 3,
44
- "Happy": 4,
45
- "Sad": 5,
46
- "Surprise": 6
47
- },
48
- "spk2id": {
49
- "jvnv-F1": 0
50
- }
51
- },
52
- "model": {
53
- "use_spk_conditioned_encoder": true,
54
- "use_noise_scaled_mas": true,
55
- "use_mel_posterior_encoder": false,
56
- "use_duration_discriminator": true,
57
- "inter_channels": 192,
58
- "hidden_channels": 192,
59
- "filter_channels": 768,
60
- "n_heads": 2,
61
- "n_layers": 6,
62
- "kernel_size": 3,
63
- "p_dropout": 0.1,
64
- "resblock": "1",
65
- "resblock_kernel_sizes": [3, 7, 11],
66
- "resblock_dilation_sizes": [
67
- [1, 3, 5],
68
- [1, 3, 5],
69
- [1, 3, 5]
70
- ],
71
- "upsample_rates": [8, 8, 2, 2, 2],
72
- "upsample_initial_channel": 512,
73
- "upsample_kernel_sizes": [16, 16, 8, 2, 2],
74
- "n_layers_q": 3,
75
- "use_spectral_norm": false,
76
- "gin_channels": 256
77
- },
78
- "version": "1.0"
79
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
model_assets/jvnv-F1/jvnv-F1.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:62c45494f0222888f9e8834ba3ccdc7cb53024e67b6f9903ceff4c011d44630c
3
- size 198768188
 
 
 
 
model_assets/jvnv-F1/style_vectors.npy DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:1f959bb45ed0922efc31ff24e9147253814f42cb1d2d1e2bb10391a9df368489
3
- size 7296
 
 
 
 
model_assets/jvnv-F2/config.json DELETED
@@ -1,79 +0,0 @@
1
- {
2
- "model_name": "jvnv-F2",
3
- "train": {
4
- "log_interval": 200,
5
- "eval_interval": 1000,
6
- "seed": 42,
7
- "epochs": 500,
8
- "learning_rate": 0.0002,
9
- "betas": [0.8, 0.99],
10
- "eps": 1e-9,
11
- "batch_size": 4,
12
- "bf16_run": true,
13
- "lr_decay": 0.99995,
14
- "segment_size": 16384,
15
- "init_lr_ratio": 1,
16
- "warmup_epochs": 0,
17
- "c_mel": 45,
18
- "c_kl": 1.0,
19
- "skip_optimizer": false,
20
- "freeze_ZH_bert": false,
21
- "freeze_JP_bert": false,
22
- "freeze_EN_bert": false
23
- },
24
- "data": {
25
- "training_files": "Data/jvnv-F2/train.list",
26
- "validation_files": "Data/jvnv-F2/val.list",
27
- "max_wav_value": 32768.0,
28
- "sampling_rate": 44100,
29
- "filter_length": 2048,
30
- "hop_length": 512,
31
- "win_length": 2048,
32
- "n_mel_channels": 128,
33
- "mel_fmin": 0.0,
34
- "mel_fmax": null,
35
- "add_blank": true,
36
- "n_speakers": 1,
37
- "cleaned_text": true,
38
- "num_styles": 7,
39
- "style2id": {
40
- "Neutral": 0,
41
- "Angry": 1,
42
- "Disgust": 2,
43
- "Fear": 3,
44
- "Happy": 4,
45
- "Sad": 5,
46
- "Surprise": 6
47
- },
48
- "spk2id": {
49
- "jvnv-F2": 0
50
- }
51
- },
52
- "model": {
53
- "use_spk_conditioned_encoder": true,
54
- "use_noise_scaled_mas": true,
55
- "use_mel_posterior_encoder": false,
56
- "use_duration_discriminator": true,
57
- "inter_channels": 192,
58
- "hidden_channels": 192,
59
- "filter_channels": 768,
60
- "n_heads": 2,
61
- "n_layers": 6,
62
- "kernel_size": 3,
63
- "p_dropout": 0.1,
64
- "resblock": "1",
65
- "resblock_kernel_sizes": [3, 7, 11],
66
- "resblock_dilation_sizes": [
67
- [1, 3, 5],
68
- [1, 3, 5],
69
- [1, 3, 5]
70
- ],
71
- "upsample_rates": [8, 8, 2, 2, 2],
72
- "upsample_initial_channel": 512,
73
- "upsample_kernel_sizes": [16, 16, 8, 2, 2],
74
- "n_layers_q": 3,
75
- "use_spectral_norm": false,
76
- "gin_channels": 256
77
- },
78
- "version": "1.0"
79
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
model_assets/jvnv-F2/jvnv-F2.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:7408a75ec677d461a8e959d3f2fed5256deaa8691fd841672e0a368007f9b682
3
- size 198768188
 
 
 
 
model_assets/jvnv-F2/style_vectors.npy DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:900f8cde3a336d12193fec7b7d8e6c5dc77b3a5d719a9be3f8598389cd88e643
3
- size 7296
 
 
 
 
model_assets/jvnv-M1/config.json DELETED
@@ -1,79 +0,0 @@
1
- {
2
- "model_name": "jvnv-M1",
3
- "train": {
4
- "log_interval": 200,
5
- "eval_interval": 1000,
6
- "seed": 42,
7
- "epochs": 500,
8
- "learning_rate": 0.0002,
9
- "betas": [0.8, 0.99],
10
- "eps": 1e-9,
11
- "batch_size": 4,
12
- "bf16_run": true,
13
- "lr_decay": 0.99995,
14
- "segment_size": 16384,
15
- "init_lr_ratio": 1,
16
- "warmup_epochs": 0,
17
- "c_mel": 45,
18
- "c_kl": 1.0,
19
- "skip_optimizer": false,
20
- "freeze_ZH_bert": false,
21
- "freeze_JP_bert": false,
22
- "freeze_EN_bert": false
23
- },
24
- "data": {
25
- "training_files": "Data/jvnv-M1/train.list",
26
- "validation_files": "Data/jvnv-M1/val.list",
27
- "max_wav_value": 32768.0,
28
- "sampling_rate": 44100,
29
- "filter_length": 2048,
30
- "hop_length": 512,
31
- "win_length": 2048,
32
- "n_mel_channels": 128,
33
- "mel_fmin": 0.0,
34
- "mel_fmax": null,
35
- "add_blank": true,
36
- "n_speakers": 1,
37
- "cleaned_text": true,
38
- "num_styles": 7,
39
- "style2id": {
40
- "Neutral": 0,
41
- "Angry": 1,
42
- "Disgust": 2,
43
- "Fear": 3,
44
- "Happy": 4,
45
- "Sad": 5,
46
- "Surprise": 6
47
- },
48
- "spk2id": {
49
- "jvnv-M1": 0
50
- }
51
- },
52
- "model": {
53
- "use_spk_conditioned_encoder": true,
54
- "use_noise_scaled_mas": true,
55
- "use_mel_posterior_encoder": false,
56
- "use_duration_discriminator": true,
57
- "inter_channels": 192,
58
- "hidden_channels": 192,
59
- "filter_channels": 768,
60
- "n_heads": 2,
61
- "n_layers": 6,
62
- "kernel_size": 3,
63
- "p_dropout": 0.1,
64
- "resblock": "1",
65
- "resblock_kernel_sizes": [3, 7, 11],
66
- "resblock_dilation_sizes": [
67
- [1, 3, 5],
68
- [1, 3, 5],
69
- [1, 3, 5]
70
- ],
71
- "upsample_rates": [8, 8, 2, 2, 2],
72
- "upsample_initial_channel": 512,
73
- "upsample_kernel_sizes": [16, 16, 8, 2, 2],
74
- "n_layers_q": 3,
75
- "use_spectral_norm": false,
76
- "gin_channels": 256
77
- },
78
- "version": "1.2"
79
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
model_assets/jvnv-M1/jvnv-M1.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:397cc7e0b8ea1e290a7049802c2894315381ad84657947779078f79a36e98729
3
- size 198768188
 
 
 
 
model_assets/jvnv-M1/style_vectors.npy DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:7a925435e8c1c9efc8fc8e90e690655ab9a7bae00a790892e13e936510d04f05
3
- size 7296
 
 
 
 
model_assets/jvnv-M2/config.json DELETED
@@ -1,79 +0,0 @@
1
- {
2
- "model_name": "jvnv-M2",
3
- "train": {
4
- "log_interval": 200,
5
- "eval_interval": 1000,
6
- "seed": 42,
7
- "epochs": 300,
8
- "learning_rate": 0.0002,
9
- "betas": [0.8, 0.99],
10
- "eps": 1e-9,
11
- "batch_size": 4,
12
- "bf16_run": true,
13
- "lr_decay": 0.99995,
14
- "segment_size": 16384,
15
- "init_lr_ratio": 1,
16
- "warmup_epochs": 0,
17
- "c_mel": 45,
18
- "c_kl": 1.0,
19
- "skip_optimizer": false,
20
- "freeze_ZH_bert": false,
21
- "freeze_JP_bert": false,
22
- "freeze_EN_bert": false
23
- },
24
- "data": {
25
- "training_files": "Data/jvnv-M2/train.list",
26
- "validation_files": "Data/jvnv-M2/val.list",
27
- "max_wav_value": 32768.0,
28
- "sampling_rate": 44100,
29
- "filter_length": 2048,
30
- "hop_length": 512,
31
- "win_length": 2048,
32
- "n_mel_channels": 128,
33
- "mel_fmin": 0.0,
34
- "mel_fmax": null,
35
- "add_blank": true,
36
- "n_speakers": 1,
37
- "cleaned_text": true,
38
- "num_styles": 7,
39
- "style2id": {
40
- "Neutral": 0,
41
- "Angry": 1,
42
- "Disgust": 2,
43
- "Fear": 3,
44
- "Happy": 4,
45
- "Sad": 5,
46
- "Surprise": 6
47
- },
48
- "spk2id": {
49
- "jvnv-M2": 0
50
- }
51
- },
52
- "model": {
53
- "use_spk_conditioned_encoder": true,
54
- "use_noise_scaled_mas": true,
55
- "use_mel_posterior_encoder": false,
56
- "use_duration_discriminator": true,
57
- "inter_channels": 192,
58
- "hidden_channels": 192,
59
- "filter_channels": 768,
60
- "n_heads": 2,
61
- "n_layers": 6,
62
- "kernel_size": 3,
63
- "p_dropout": 0.1,
64
- "resblock": "1",
65
- "resblock_kernel_sizes": [3, 7, 11],
66
- "resblock_dilation_sizes": [
67
- [1, 3, 5],
68
- [1, 3, 5],
69
- [1, 3, 5]
70
- ],
71
- "upsample_rates": [8, 8, 2, 2, 2],
72
- "upsample_initial_channel": 512,
73
- "upsample_kernel_sizes": [16, 16, 8, 2, 2],
74
- "n_layers_q": 3,
75
- "use_spectral_norm": false,
76
- "gin_channels": 256
77
- },
78
- "version": "1.2"
79
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
model_assets/jvnv-M2/jvnv-M2.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:2fcc35ddfddc94234c5d3f30d3c5c865c66b0ba2ad12ed2a13afd2c4878119e2
3
- size 198768188
 
 
 
 
model_assets/jvnv-M2/style_vectors.npy DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:c965bb63fa4a759d41a8a4a3649333125d6497ae8a705d81b7d5c5bd2854797c
3
- size 7296