File size: 1,108 Bytes
8c92a11 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 |
{
// Path to the config file named as this one's base.
// NOTE(review): presumably the loader merges that file first and the keys below override it -- confirm.
"base_config": "egs/vocoder/gan/exp_config_base.json",
"preprocess": {
// Acoustic features to extract during preprocessing (mel and audio are both switched on)
"extract_mel": true,
"extract_audio": true,
// Features used for model training (mel and audio are both switched on)
"use_mel": true,
"use_audio": true
},
"model": {
  // Generator choice; the value matches the key of the settings object below.
  "generator": "bigvgan",
  "bigvgan": {
    // Stored as a string, not a number.
    // NOTE(review): presumably names a resblock variant -- confirm against the model code.
    "resblock": "1",
    "activation": "snakebeta",
    "snake_logscale": true,
    // Six upsample stages; the rates multiply to 4*4*2*2*2*2 = 256.
    // NOTE(review): this product presumably has to equal the hop size set in the base config -- confirm.
    "upsample_rates": [4, 4, 2, 2, 2, 2],
    // One entry per upsample stage; each value here is twice the matching rate above.
    "upsample_kernel_sizes": [8, 8, 4, 4, 4, 4],
    "upsample_initial_channel": 1536,
    "resblock_kernel_sizes": [3, 7, 11],
    // Three rows, the same count as resblock_kernel_sizes
    // (presumably one dilation row per kernel size -- confirm).
    "resblock_dilation_sizes": [
      [1, 3, 5],
      [1, 3, 5],
      [1, 3, 5]
    ]
  }
},
"train": {
  // Criterion names listed for training.
  // NOTE(review): presumably each name enables one loss term in the trainer -- confirm.
  "criterions": [
    "feature",
    "discriminator",
    "generator",
    "mel"
  ]
},
"inference": {
  // Batch size of 1 for the inference section.
  "batch_size": 1
}
}
|