Spaces:
Build error
Build error
K_step: 1000 | |
accumulate_grad_batches: 1 | |
audio_num_mel_bins: 128 | |
audio_sample_rate: 44100 | |
binarization_args: | |
shuffle: false | |
with_align: true | |
with_f0: true | |
with_hubert: true | |
with_spk_embed: false | |
with_wav: false | |
binarizer_cls: preprocessing.SVCpre.SVCBinarizer | |
binary_data_dir: data/binary/aquapre | |
check_val_every_n_epoch: 10 | |
choose_test_manually: false | |
clip_grad_norm: 1 | |
config_path: F:\diff-svc-main\training\config_nsf.yaml | |
content_cond_steps: [] | |
cwt_add_f0_loss: false | |
cwt_hidden_size: 128 | |
cwt_layers: 2 | |
cwt_loss: l1 | |
cwt_std_scale: 0.8 | |
datasets: | |
- opencpop | |
debug: false | |
dec_ffn_kernel_size: 9 | |
dec_layers: 4 | |
decay_steps: 20000 | |
decoder_type: fft | |
dict_dir: '' | |
diff_decoder_type: wavenet | |
diff_loss_type: l2 | |
dilation_cycle_length: 4 | |
dropout: 0.1 | |
ds_workers: 4 | |
dur_enc_hidden_stride_kernel: | |
- 0,2,3 | |
- 0,2,3 | |
- 0,1,3 | |
dur_loss: mse | |
dur_predictor_kernel: 3 | |
dur_predictor_layers: 5 | |
enc_ffn_kernel_size: 9 | |
enc_layers: 4 | |
encoder_K: 8 | |
encoder_type: fft | |
endless_ds: false | |
f0_bin: 256 | |
f0_max: 1100.0 | |
f0_min: 40.0 | |
f0_static: '{"28.0": 0.07, "29.0": 0.03, "31.0": 0.05, "32.0": 0.08, "33.0": 0.12, | |
"34.0": 0.02, "35.0": 0.06, "36.0": 0.02, "37.0": 0.01, "38.0": 0.1, "39.0": 0.05, | |
"40.0": 0.09, "41.0": 0.14, "42.0": 0.16, "43.0": 0.03, "44.0": 0.42, "45.0": 0.74, | |
"46.0": 1.13, "47.0": 1.49, "48.0": 1.76, "49.0": 2.59, "50.0": 3.03, "51.0": 2.71, | |
"52.0": 1.93, "53.0": 1.11, "54.0": 0.78, "55.0": 3.33, "56.0": 20.38, "57.0": 69.6, | |
"58.0": 167.04, "59.0": 245.1, "60.0": 318.87, "61.0": 373.41, "62.0": 434.86, "63.0": | |
415.63, "64.0": 448.97, "65.0": 452.99, "66.0": 474.88, "67.0": 471.54, "68.0": | |
455.78, "69.0": 421.71, "70.0": 372.06, "71.0": 323.85, "72.0": 292.8, "73.0": 238.94, | |
"74.0": 190.5, "75.0": 132.86, "76.0": 88.03, "77.0": 53.16, "78.0": 32.96, "79.0": | |
23.66, "80.0": 14.74, "81.0": 8.54, "82.0": 5.0, "83.0": 3.32, "84.0": 2.29, "85.0": | |
0.91, "total_time": 6576.43}' | |
ffn_act: gelu | |
ffn_padding: SAME | |
fft_size: 2048 | |
fmax: 16000 | |
fmin: 40 | |
fs2_ckpt: '' | |
gaussian_start: true | |
gen_dir_name: '' | |
gen_tgt_spk_id: -1 | |
hidden_size: 256 | |
hop_size: 512 | |
hubert_gpu: false | |
hubert_path: checkpoints/hubert/hubert_soft.pt | |
infer: false | |
keep_bins: 128 | |
lambda_commit: 0.25 | |
lambda_energy: 0.0 | |
lambda_f0: 1.0 | |
lambda_ph_dur: 0.3 | |
lambda_sent_dur: 1.0 | |
lambda_uv: 1.0 | |
lambda_word_dur: 1.0 | |
load_ckpt: '' | |
log_interval: 100 | |
loud_norm: false | |
lr: 0.0008 | |
max_beta: 0.02 | |
max_epochs: 3000 | |
max_eval_sentences: 1 | |
max_eval_tokens: 60000 | |
max_frames: 42000 | |
max_input_tokens: 6000 | |
max_sentences: 88 | |
max_tokens: 128000 | |
max_updates: 1000000 | |
mel_loss: ssim:0.5|l1:0.5 | |
mel_vmax: 1.5 | |
mel_vmin: -6.0 | |
min_level_db: -120 | |
no_fs2: true | |
norm_type: gn | |
num_ckpt_keep: 10 | |
num_heads: 2 | |
num_sanity_val_steps: 1 | |
num_spk: 1 | |
num_test_samples: 0 | |
num_valid_plots: 10 | |
optimizer_adam_beta1: 0.9 | |
optimizer_adam_beta2: 0.98 | |
out_wav_norm: false | |
pe_ckpt: checkpoints/0102_xiaoma_pe/model_ckpt_steps_60000.ckpt | |
pe_enable: false | |
perform_enhance: true | |
pitch_ar: false | |
pitch_enc_hidden_stride_kernel: | |
- 0,2,5 | |
- 0,2,5 | |
- 0,2,5 | |
pitch_extractor: parselmouth | |
pitch_loss: l2 | |
pitch_norm: log | |
pitch_type: frame | |
pndm_speedup: 10 | |
pre_align_args: | |
allow_no_txt: false | |
denoise: false | |
forced_align: mfa | |
txt_processor: zh_g2pM | |
use_sox: true | |
use_tone: false | |
pre_align_cls: data_gen.singing.pre_align.SingingPreAlign | |
predictor_dropout: 0.5 | |
predictor_grad: 0.1 | |
predictor_hidden: -1 | |
predictor_kernel: 5 | |
predictor_layers: 5 | |
prenet_dropout: 0.5 | |
prenet_hidden_size: 256 | |
pretrain_fs_ckpt: '' | |
processed_data_dir: xxx | |
profile_infer: false | |
raw_data_dir: data/raw/aquapre | |
ref_norm_layer: bn | |
rel_pos: true | |
reset_phone_dict: true | |
residual_channels: 512 | |
residual_layers: 20 | |
save_best: false | |
save_ckpt: true | |
save_codes: | |
- configs | |
- modules | |
- src | |
- utils | |
save_f0: true | |
save_gt: false | |
schedule_type: linear | |
seed: 1234 | |
sort_by_len: true | |
speaker_id: aqua | |
spec_max: | |
- 0.18377557396888733 | |
- -0.33469653129577637 | |
- -0.3073468506336212 | |
- -0.21027648448944092 | |
- 0.23178215324878693 | |
- 0.5297451019287109 | |
- 0.7021887898445129 | |
- 0.7711099982261658 | |
- 0.7912386059761047 | |
- 0.6609739065170288 | |
- 0.649876058101654 | |
- 0.6327046751976013 | |
- 0.6892049908638 | |
- 0.6026111841201782 | |
- 0.6834777593612671 | |
- 0.7417489886283875 | |
- 0.6040375828742981 | |
- 0.5854794383049011 | |
- 0.7123280167579651 | |
- 0.5886657238006592 | |
- 0.6135984063148499 | |
- 0.5388530492782593 | |
- 0.5932422280311584 | |
- 0.535581111907959 | |
- 0.57913738489151 | |
- 0.6827316880226135 | |
- 0.6265526413917542 | |
- 0.6557696461677551 | |
- 0.6586976647377014 | |
- 0.5687282085418701 | |
- 0.6218562722206116 | |
- 0.6349128484725952 | |
- 0.6176865100860596 | |
- 0.6212958097457886 | |
- 0.6277656555175781 | |
- 0.5551338195800781 | |
- 0.6126622557640076 | |
- 0.5821346640586853 | |
- 0.577056348323822 | |
- 0.5649800300598145 | |
- 0.5984634757041931 | |
- 0.4873456656932831 | |
- 0.47209471464157104 | |
- 0.4387756586074829 | |
- 0.4690910577774048 | |
- 0.4616055190563202 | |
- 0.3555675446987152 | |
- 0.3898852467536926 | |
- 0.3676068186759949 | |
- 0.4632047414779663 | |
- 0.37983986735343933 | |
- 0.3877682685852051 | |
- 0.3099276125431061 | |
- 0.3261813223361969 | |
- 0.34168118238449097 | |
- 0.3004901111125946 | |
- 0.3512653112411499 | |
- 0.2647061347961426 | |
- 0.2685043215751648 | |
- 0.20390087366104126 | |
- 0.1825377196073532 | |
- 0.22067485749721527 | |
- 0.20306138694286346 | |
- 0.12710601091384888 | |
- 0.10927848517894745 | |
- 0.1117628887295723 | |
- 0.14148156344890594 | |
- 0.122605100274086 | |
- 0.08032718300819397 | |
- 0.12159623205661774 | |
- -0.04923255369067192 | |
- -0.07824847847223282 | |
- 0.03441360592842102 | |
- 0.07093964517116547 | |
- -0.1269683688879013 | |
- 0.0027632638812065125 | |
- -0.045093610882759094 | |
- -0.04115259647369385 | |
- 0.029067598283290863 | |
- -0.009453626349568367 | |
- -0.0470033697783947 | |
- -0.04894810542464256 | |
- -0.06236470118165016 | |
- -0.20086997747421265 | |
- -0.2363593578338623 | |
- -0.17289961874485016 | |
- -0.219277486205101 | |
- -0.2934815585613251 | |
- -0.30551621317863464 | |
- -0.2513120770454407 | |
- -0.26792851090431213 | |
- -0.33068278431892395 | |
- -0.37532031536102295 | |
- -0.365634560585022 | |
- -0.3379015326499939 | |
- -0.26979681849479675 | |
- -0.20316314697265625 | |
- -0.2109878957271576 | |
- -0.16927000880241394 | |
- -0.1698305308818817 | |
- -0.2739156186580658 | |
- -0.2700604200363159 | |
- -0.32284122705459595 | |
- -0.44529229402542114 | |
- -0.4002469480037689 | |
- -0.2441970407962799 | |
- -0.19795942306518555 | |
- -0.2462945580482483 | |
- -0.0673084482550621 | |
- -0.22117790579795837 | |
- -0.21418607234954834 | |
- -0.39467209577560425 | |
- -0.4388139843940735 | |
- -0.3227368891239166 | |
- -0.30530503392219543 | |
- -0.3201104998588562 | |
- -0.39839836955070496 | |
- -0.464596688747406 | |
- -0.5399728417396545 | |
- -0.5515261292457581 | |
- -0.520453691482544 | |
- -0.6714966893196106 | |
- -0.6414765119552612 | |
- -0.6108742356300354 | |
- -0.6762520670890808 | |
- -0.7067146301269531 | |
- -0.7586700320243835 | |
- -0.6640384793281555 | |
spec_min: | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.999994277954102 | |
- -4.989471912384033 | |
- -4.999994277954102 | |
spk_cond_steps: [] | |
stop_token_weight: 5.0 | |
task_cls: training.task.SVC_task.SVCTask | |
test_ids: [] | |
test_input_dir: '' | |
test_num: 0 | |
test_prefixes: | |
- test | |
test_set_name: test | |
timesteps: 1000 | |
train_set_name: train | |
use_cn_hubert: false | |
use_crepe: true | |
use_denoise: false | |
use_energy_embed: false | |
use_gt_dur: false | |
use_gt_f0: false | |
use_midi: false | |
use_nsf: true | |
use_pitch_embed: true | |
use_pos_embed: true | |
use_spk_embed: false | |
use_spk_id: false | |
use_split_spk_id: false | |
use_uv: false | |
use_var_enc: false | |
use_vec: false | |
val_check_interval: 2000 | |
valid_num: 0 | |
valid_set_name: valid | |
vocoder: network.vocoders.nsf_hifigan.NsfHifiGAN | |
vocoder_ckpt: checkpoints/nsf_hifigan/model | |
warmup_updates: 2000 | |
wav2spec_eps: 1e-6 | |
weight_decay: 0 | |
win_size: 2048 | |
work_dir: checkpoints/aquapre | |