Sucial committed on
Commit
6e18dc2
1 Parent(s): b486b15

Upload 3 files

Browse files
Files changed (3) hide show
  1. config.yaml +84 -0
  2. model_steps_64000_simplified.ckpt +3 -0
  3. rmvpe.pt +3 -0
config.yaml ADDED
@@ -0,0 +1,84 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ accumulate_grad_batches: 1
2
+ audio_sample_rate: 44100
3
+ binarization_args:
4
+ num_workers: 0
5
+ shuffle: true
6
+ binarizer_cls: preprocessing.MIDIExtractionBinarizer
7
+ binary_data_dir: data/some_ds_fixmel_spk3_aug8/binary
8
+ clip_grad_norm: 1
9
+ dataloader_prefetch_factor: 2
10
+ ddp_backend: nccl
11
+ ds_workers: 4
12
+ finetune_ckpt_path: null
13
+ finetune_enabled: false
14
+ finetune_ignored_params: []
15
+ finetune_strict_shapes: true
16
+ fmax: 8000
17
+ fmin: 40
18
+ freezing_enabled: false
19
+ frozen_params: []
20
+ hop_size: 512
21
+ log_interval: 100
22
+ lr_scheduler_args:
23
+ min_lr: 1.0e-05
24
+ scheduler_cls: lr_scheduler.scheduler.WarmupLR
25
+ warmup_steps: 5000
26
+ max_batch_frames: 80000
27
+ max_batch_size: 8
28
+ max_updates: 10000000
29
+ max_val_batch_frames: 10000
30
+ max_val_batch_size: 1
31
+ midi_extractor_args:
32
+ attention_drop: 0.1
33
+ attention_heads: 8
34
+ attention_heads_dim: 64
35
+ conv_drop: 0.1
36
+ dim: 512
37
+ ffn_latent_drop: 0.1
38
+ ffn_out_drop: 0.1
39
+ kernel_size: 31
40
+ lay: 8
41
+ use_lay_skip: true
42
+ midi_max: 128
43
+ midi_min: 0
44
+ midi_num_bins: 256
45
+ midi_prob_deviation: 0.5
46
+ midi_shift_proportion: 0.0
47
+ midi_shift_range:
48
+ - -6
49
+ - 6
50
+ model_cls: modules.model.Gmidi_conform.midi_conforms
51
+ num_ckpt_keep: 5
52
+ num_sanity_val_steps: 1
53
+ num_valid_plots: 300
54
+ optimizer_args:
55
+ beta1: 0.9
56
+ beta2: 0.98
57
+ lr: 0.0001
58
+ optimizer_cls: torch.optim.AdamW
59
+ weight_decay: 0
60
+ pe: rmvpe
61
+ pe_ckpt: tools/SOME_weights/rmvpe.pt
62
+ permanent_ckpt_interval: 40000
63
+ permanent_ckpt_start: 200000
64
+ pl_trainer_accelerator: auto
65
+ pl_trainer_devices: auto
66
+ pl_trainer_num_nodes: 1
67
+ pl_trainer_precision: 32-true
68
+ pl_trainer_strategy: auto
69
+ raw_data_dir: []
70
+ rest_threshold: 0.1
71
+ sampler_frame_count_grid: 6
72
+ seed: 114514
73
+ sort_by_len: true
74
+ task_cls: training.MIDIExtractionTask
75
+ test_prefixes: null
76
+ train_set_name: train
77
+ units_dim: 80
78
+ units_encoder: mel
79
+ units_encoder_ckpt: pretrained/contentvec/checkpoint_best_legacy_500.pt
80
+ use_buond_loss: true
81
+ use_midi_loss: true
82
+ val_check_interval: 4000
83
+ valid_set_name: valid
84
+ win_size: 2048
model_steps_64000_simplified.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a246c7063ec2856097004dcefa2093a8b6ccff7a6cde1cd49e8f3f227ede50e
3
+ size 471060793
rmvpe.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:19dc1809cf4cdb0a18db93441816bc327e14e5644b72eeaae5220560c6736fe2
3
+ size 368492925