ShiromiyaGamer committed on
Commit
c3d98d9
1 Parent(s): e60af07

Upload 2 files

Browse files
mdx23c-dereverb/config_dereverb_mdx23c.yaml ADDED
@@ -0,0 +1,135 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ audio:
2
+ chunk_size: 261120
3
+ dim_f: 4096
4
+ dim_t: 256
5
+ hop_length: 1024
6
+ n_fft: 8192
7
+ num_channels: 2
8
+ sample_rate: 44100
9
+ min_mean_abs: 0.001
10
+
11
+ model:
12
+ act: gelu
13
+ bottleneck_factor: 4
14
+ growth: 128
15
+ norm: InstanceNorm
16
+ num_blocks_per_scale: 2
17
+ num_channels: 128
18
+ num_scales: 5
19
+ num_subbands: 4
20
+ scale:
21
+ - 2
22
+ - 2
23
+
24
+ training:
25
+ batch_size: 2
26
+ gradient_accumulation_steps: 1
27
+ grad_clip: 0
28
+ instruments:
29
+ - dry
30
+ - other
31
+ lr: 1.0e-06
32
+ patience: 4
33
+ reduce_factor: 0.93
34
+ target_instrument: null
35
+ num_epochs: 40
36
+ num_steps: 1000
37
+ q: 0.95
38
+ coarse_loss_clip: true
39
+ ema_momentum: 0.999
40
+ optimizer: adamw
41
+ read_metadata_procs: 8 # Number of processes to use during metadata reading for dataset. Can speed up metadata generation
42
+ other_fix: false # needed when checking on the multisong dataset whether "other" is actually instrumental
43
+ use_amp: true # enable or disable usage of mixed precision (float16) - usually it must be true
44
+
45
+ augmentations:
46
+ enable: false # enable or disable all augmentations (to quickly disable them if needed)
47
+ loudness: true # randomly change loudness of each stem on the range (loudness_min; loudness_max)
48
+ loudness_min: 0.5
49
+ loudness_max: 1.5
50
+ mixup: true # mix several stems of same type with some probability (only works for dataset types: 1, 2, 3)
51
+ mixup_probs: !!python/tuple # 2 additional stems of the same type (1st with prob 0.2, 2nd with prob 0.02)
52
+ - 0.2
53
+ - 0.02
54
+ mixup_loudness_min: 0.5
55
+ mixup_loudness_max: 1.5
56
+
57
+ all:
58
+ channel_shuffle: 0.5 # Set 0 or lower to disable
59
+ random_inverse: 0.05 # inverse track (a lower probability is better)
60
+ random_polarity: 0.5 # polarity change (multiply waveform by -1)
61
+
62
+ # pedalboard chorus block
63
+ pedalboard_chorus: 0.001
64
+ pedalboard_chorus_rate_hz_min: 1.0
65
+ pedalboard_chorus_rate_hz_max: 7.0
66
+ pedalboard_chorus_depth_min: 0.25
67
+ pedalboard_chorus_depth_max: 0.95
68
+ pedalboard_chorus_centre_delay_ms_min: 3
69
+ pedalboard_chorus_centre_delay_ms_max: 10
70
+ pedalboard_chorus_feedback_min: 0.0
71
+ pedalboard_chorus_feedback_max: 0.01
72
+ pedalboard_chorus_mix_min: 0.1
73
+ pedalboard_chorus_mix_max: 0.9
74
+
75
+ # pedalboard phazer block
76
+ pedalboard_phazer: 0.001
77
+ pedalboard_phazer_rate_hz_min: 1.0
78
+ pedalboard_phazer_rate_hz_max: 10.0
79
+ pedalboard_phazer_depth_min: 0.25
80
+ pedalboard_phazer_depth_max: 0.95
81
+ pedalboard_phazer_centre_frequency_hz_min: 200
82
+ pedalboard_phazer_centre_frequency_hz_max: 12000
83
+ pedalboard_phazer_feedback_min: 0.0
84
+ pedalboard_phazer_feedback_max: 0.5
85
+ pedalboard_phazer_mix_min: 0.1
86
+ pedalboard_phazer_mix_max: 0.9
87
+
88
+ # pedalboard pitch shift block
89
+ pedalboard_pitch_shift: 0.01
90
+ pedalboard_pitch_shift_semitones_min: -7
91
+ pedalboard_pitch_shift_semitones_max: 7
92
+
93
+ # pedalboard resample block
94
+ pedalboard_resample: 0.001
95
+ pedalboard_resample_target_sample_rate_min: 4000
96
+ pedalboard_resample_target_sample_rate_max: 44100
97
+
98
+ mp3_compression_min_bitrate: 32
99
+ mp3_compression_max_bitrate: 320
100
+ mp3_compression_backend: "lameenc"
101
+
102
+ dry:
103
+ # pedalboard distortion block
104
+ pedalboard_distortion: 0.001
105
+ pedalboard_distortion_drive_db_min: 1.0
106
+ pedalboard_distortion_drive_db_max: 25.0
107
+
108
+ tanh_distortion: 0.05
109
+ tanh_distortion_min: 0.1
110
+ tanh_distortion_max: 0.7
111
+ # pedalboard bitcrash block
112
+ pedalboard_bitcrash: 0.005
113
+ pedalboard_bitcrash_bit_depth_min: 4
114
+ pedalboard_bitcrash_bit_depth_max: 16
115
+
116
+ seven_band_parametric_eq: 0.24
117
+ seven_band_parametric_eq_min_gain_db: -9
118
+ seven_band_parametric_eq_max_gain_db: 9
119
+
120
+ gaussian_noise: 0.005
121
+ gaussian_noise_min_amplitude: 0.001
122
+ gaussian_noise_max_amplitude: 0.01
123
+
124
+ time_stretch: 0.01
125
+ time_stretch_min_rate: 0.8
126
+ time_stretch_max_rate: 1.25
127
+ other:
128
+ seven_band_parametric_eq: 0.24
129
+ seven_band_parametric_eq_min_gain_db: -9
130
+ seven_band_parametric_eq_max_gain_db: 9
131
+
132
+ inference:
133
+ batch_size: 2
134
+ dim_t: 256
135
+ num_overlap: 4
mdx23c-dereverb/dereverb_mdx23c_sdr_6.9096.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eae2471b707758d74db38ac1b1d5800e12f57c4e9d1ebbb2faf004b8e086e914
3
+ size 448098867