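# The following lines are residue from the web file viewer this file was
# copied from; they are kept as comments so the document parses as YAML.
# bsrnn-vocals / hparams.yaml
# crlandsc's picture
# uploaded vocals model
# bcb1f8a
# raw
# history blame
# 3.67 kB
---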
# Model hyperparameters.
# NOTE(review): nesting reconstructed from a copy that had lost its
# indentation (flat, `sr` and `is_mono` here collided with the same keys in
# the dataset sections) — confirm against the training repository's config.
model:
  sr: 44100
  n_fft: 2048
  # Five two-element pairs.
  # NOTE(review): presumably [upper frequency, band width] — confirm against
  # the model code.
  bandsplits:
    - [1000, 100]
    - [4000, 250]
    - [8000, 500]
    - [16000, 1000]
    - [20000, 2000]
  bottleneck_layer: rnn
  t_timesteps: 263
  fc_dim: 128
  rnn_dim: 256
  rnn_type: LSTM
  bidirectional: true
  num_layers: 12
  mlp_dim: 512
  return_mask: false
  complex_as_channel: true
  is_mono: false
# Training dataset settings.
# NOTE(review): nesting reconstructed from a copy that had lost its
# indentation — confirm. `file_dir` is an absolute path on the original
# author's machine and will need adjusting elsewhere.
train_dataset:
  file_dir: /home/crlandsc/Music-Demixing-with-Band-Split-RNN/datasets/Vocals
  txt_dir: files/
  txt_path: null
  target: vocals
  is_training: true
  is_mono: false
  sr: 44100
  preload_dataset: false
  silent_prob: 0.1
  mix_prob: 0.25
  mix_tgt_too: false
# Test dataset settings.
# NOTE(review): nesting reconstructed from a copy that had lost its
# indentation — confirm. `in_fp` is an absolute path on the original
# author's machine.
test_dataset:
  in_fp: /home/crlandsc/Music-Demixing-with-Band-Split-RNN/datasets/Vocals
  target: vocals
  is_mono: false
  sr: 44100
  # NOTE(review): win_size / hop_size are presumably in seconds — confirm.
  win_size: 3
  hop_size: 0.5
  batch_size: 4
  window: null
# Settings for the `sad` component.
# NOTE(review): presumably source-activity detection used while preparing
# data — confirm. Nesting reconstructed from a copy that had lost its
# indentation (flat, `gamma` here collided with the scheduler's `gamma`).
sad:
  sr: 44100
  window_size_in_sec: 6
  overlap_ratio: 0.5
  n_chunks_per_segment: 10
  eps: 1.0e-05
  gamma: 0.001
  threshold_max_quantile: 0.15
  threshold_segment: 0.5
# Data augmentations; each entry names the class to build via `_target_`.
# NOTE(review): nesting reconstructed from a copy that had lost its
# indentation (flat, the two `_target_` / `p` keys overwrote each other) —
# confirm.
augmentations:
  randomcrop:
    _target_: data.augmentations.RandomCrop
    p: 1
    chunk_size_sec: 3
    sr: 44100
    # Same values as the featurizer's n_fft / hop_length in this file.
    window_stft: 2048
    hop_stft: 512
  gainscale:
    _target_: data.augmentations.GainScale
    p: 0.5
    min_db: -10.0
    max_db: 10.0
# Forward and inverse STFT transforms (torchaudio). Both use the same
# n_fft / win_length / hop_length.
# NOTE(review): nesting reconstructed from a copy that had lost its
# indentation — confirm.
featurizer:
  direct_transform:
    _target_: torchaudio.transforms.Spectrogram
    n_fft: 2048
    win_length: 2048
    hop_length: 512
    # power=None makes torchaudio's Spectrogram return the complex spectrum.
    power: null
  inverse_transform:
    _target_: torchaudio.transforms.InverseSpectrogram
    n_fft: 2048
    win_length: 2048
    hop_length: 512
# PyTorch Lightning callbacks, one mapping per callback.
# NOTE(review): nesting reconstructed from a copy that had lost its
# indentation (flat, the two checkpoint callbacks overwrote each other's
# monitor/mode/filename) — confirm. The `dirpath` values are absolute paths
# from the original training run.
callbacks:
  lr_monitor:
    _target_: pytorch_lightning.callbacks.LearningRateMonitor
    logging_interval: epoch
  # Keeps the 4 checkpoints with the lowest `train/loss`.
  model_ckpt:
    _target_: pytorch_lightning.callbacks.ModelCheckpoint
    monitor: train/loss
    mode: min
    save_top_k: 4
    dirpath: /home/crlandsc/Music-Demixing-with-Band-Split-RNN/src/logs/bandsplitrnn/2023-04-28_17-51/weights
    # Quoted because the template contains braces and colons.
    filename: 'epoch{epoch:02d}-train_loss{train/loss:.2f}'
    auto_insert_metric_name: false
  # Keeps the 4 checkpoints with the highest `train/usdr`.
  model_ckpt_usdr:
    _target_: pytorch_lightning.callbacks.ModelCheckpoint
    monitor: train/usdr
    mode: max
    save_top_k: 4
    dirpath: /home/crlandsc/Music-Demixing-with-Band-Split-RNN/src/logs/bandsplitrnn/2023-04-28_17-51/weights
    filename: 'epoch{epoch:02d}-train_usdr{train/usdr:.2f}'
    auto_insert_metric_name: false
  # NOTE(review): presumably an exponential moving average of the weights —
  # confirm against utils.callbacks.EMA.
  ema:
    _target_: utils.callbacks.EMA
    decay: 0.9999
    validate_original_weights: false
    every_n_steps: 1
# Experiment loggers, one mapping per logger.
# NOTE(review): nesting reconstructed from a copy that had lost its
# indentation (flat, `name`, `prefix` and `save_dir` of the two loggers
# overwrote each other) — confirm.
logger:
  tensorboard:
    _target_: pytorch_lightning.loggers.TensorBoardLogger
    save_dir: /home/crlandsc/Music-Demixing-with-Band-Split-RNN/src/logs/bandsplitrnn/2023-04-28_17-51/tb_logs
    name: ''
    version: ''
    log_graph: false
    default_hp_metric: false
    prefix: ''
  wandb:
    _target_: pytorch_lightning.loggers.WandbLogger
    project: MDX_BSRNN_23
    name: vocals
    save_dir: wandb_logs
    offline: false
    id: null
    log_model: false
    prefix: ''
    job_type: train
    group: ''
    tags: []
# Settings for the training data loader.
# NOTE(review): nesting reconstructed from a copy that had lost its
# indentation (flat, these keys collided with the validation loader's) —
# confirm.
train_loader:
  batch_size: 8
  num_workers: 12
  shuffle: true
  drop_last: true
# Settings for the validation data loader.
# NOTE(review): nesting reconstructed from a copy that had lost its
# indentation (flat, these keys collided with the training loader's) —
# confirm.
val_loader:
  batch_size: 2
  num_workers: 8
  shuffle: false
  drop_last: false
# Optimizer: Adam with a learning rate of 0.001.
# NOTE(review): nesting reconstructed from a copy that had lost its
# indentation — confirm.
opt:
  _target_: torch.optim.Adam
  lr: 0.001
# Learning-rate schedule parameters.
# NOTE(review): how warmup_step / alpha / gamma are combined is defined by
# the training code, not visible here. Nesting reconstructed from a copy
# that had lost its indentation — confirm.
sch:
  warmup_step: 10
  alpha: 0.1
  gamma: 0.9899494936611665
# Relative path to a `.ckpt` file from a run stamped 2023-04-28_14-12.
# NOTE(review): presumably the checkpoint this run resumed from — confirm.
ckpt_path: 'logs/bandsplitrnn/2023-04-28_14-12/weights/epoch217-train_usdr7.07.ckpt'
# Trainer settings.
# NOTE(review): presumably passed to pytorch_lightning.Trainer — confirm.
# Nesting reconstructed from a copy that had lost its indentation.
trainer:
  fast_dev_run: false
  min_epochs: 100
  max_epochs: 500
  log_every_n_steps: 10
  accelerator: auto
  devices: auto
  gradient_clip_val: 5
  precision: 32
  enable_progress_bar: true
  benchmark: true
  deterministic: false
# Experiment directory name; the same string appears as the `bandsplitrnn`
# path component in the log and checkpoint paths of this file.
experiment_dirname: 'bandsplitrnn'
# Weights & Biases API key. The credential previously committed here in
# plain text has been removed; treat it as compromised and revoke it.
# Supply the key through the WANDB_API_KEY environment variable (or
# `wandb login`) instead of storing it in this file.
# NOTE(review): confirm the training script tolerates a null value here.
wandb_api_key: null