Politrees committed on
Commit
491e44c
·
verified ·
1 Parent(s): 246dc71

Upload 62 files

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. Bandit_models/checkpoint-multi_fixed.ckpt +3 -0
  2. Bandit_models/config_dnr_bandit_bsrnn_multi_mus64.yaml +78 -0
  3. Bandit_models/config_dnr_bandit_v2_mus64.yaml +78 -0
  4. Bandit_models/model_bandit_plus_dnr_sdr_11.47.ckpt +3 -0
  5. MDX23C_models/MDX23C-8KFFT-InstVoc_HQ.ckpt +3 -0
  6. MDX23C_models/MDX23C-8KFFT-InstVoc_HQ_2.ckpt +3 -0
  7. MDX23C_models/MDX23C-De-Reverb-aufr33-jarredou.ckpt +3 -0
  8. MDX23C_models/MDX23C-DrumSep-aufr33-jarredou.ckpt +3 -0
  9. MDX23C_models/MDX23C_D1581.ckpt +3 -0
  10. MDX23C_models/config_dereverb_mdx23c.yaml +135 -0
  11. MDX23C_models/config_drumsep_mdx23c.yaml +87 -0
  12. MDX23C_models/config_mdx23c_similarity.yaml +47 -0
  13. MDX23C_models/model_2_stem_061321.yaml +36 -0
  14. MDX23C_models/model_2_stem_full_band_8k.yaml +43 -0
  15. MDX23C_models/model_mdx23c_ep_271_l1_freq_72.2383.ckpt +3 -0
  16. MDXNet_models/Kim_Inst.onnx +3 -0
  17. MDXNet_models/Kim_Vocal_1.onnx +3 -0
  18. MDXNet_models/Kim_Vocal_2.onnx +3 -0
  19. MDXNet_models/Reverb_HQ_By_FoxJoy.onnx +3 -0
  20. MDXNet_models/UVR-MDX-NET-Inst_1.onnx +3 -0
  21. MDXNet_models/UVR-MDX-NET-Inst_2.onnx +3 -0
  22. MDXNet_models/UVR-MDX-NET-Inst_3.onnx +3 -0
  23. MDXNet_models/UVR-MDX-NET-Inst_HQ_1.onnx +3 -0
  24. MDXNet_models/UVR-MDX-NET-Inst_HQ_2.onnx +3 -0
  25. MDXNet_models/UVR-MDX-NET-Inst_HQ_3.onnx +3 -0
  26. MDXNet_models/UVR-MDX-NET-Inst_HQ_4.onnx +3 -0
  27. MDXNet_models/UVR-MDX-NET-Inst_HQ_5.onnx +3 -0
  28. MDXNet_models/UVR-MDX-NET-Inst_Main.onnx +3 -0
  29. MDXNet_models/UVR-MDX-NET-Inst_full_292.onnx +3 -0
  30. MDXNet_models/UVR-MDX-NET-Voc_FT.onnx +3 -0
  31. MDXNet_models/UVR-MDX-NET_Crowd_HQ_1.onnx +3 -0
  32. MDXNet_models/UVR-MDX-NET_Inst_187_beta.onnx +3 -0
  33. MDXNet_models/UVR-MDX-NET_Inst_82_beta.onnx +3 -0
  34. MDXNet_models/UVR-MDX-NET_Inst_90_beta.onnx +3 -0
  35. MDXNet_models/UVR-MDX-NET_Main_340.onnx +3 -0
  36. MDXNet_models/UVR-MDX-NET_Main_390.onnx +3 -0
  37. MDXNet_models/UVR-MDX-NET_Main_406.onnx +3 -0
  38. MDXNet_models/UVR-MDX-NET_Main_427.onnx +3 -0
  39. MDXNet_models/UVR-MDX-NET_Main_438.onnx +3 -0
  40. MDXNet_models/UVR_MDXNET_1_9703.onnx +3 -0
  41. MDXNet_models/UVR_MDXNET_2_9682.onnx +3 -0
  42. MDXNet_models/UVR_MDXNET_3_9662.onnx +3 -0
  43. MDXNet_models/UVR_MDXNET_9482.onnx +3 -0
  44. MDXNet_models/UVR_MDXNET_KARA.onnx +3 -0
  45. MDXNet_models/UVR_MDXNET_KARA_2.onnx +3 -0
  46. MDXNet_models/UVR_MDXNET_Main.onnx +3 -0
  47. MDXNet_models/kuielab_a_bass.onnx +3 -0
  48. MDXNet_models/kuielab_a_drums.onnx +3 -0
  49. MDXNet_models/kuielab_a_other.onnx +3 -0
  50. MDXNet_models/kuielab_a_vocals.onnx +3 -0
Bandit_models/checkpoint-multi_fixed.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20bcd513dc7eb0541dd045909a4e7dff8dab474cc2efba4904101c76524aee85
3
+ size 149133378
Bandit_models/config_dnr_bandit_bsrnn_multi_mus64.yaml ADDED
@@ -0,0 +1,78 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ name: "MultiMaskMultiSourceBandSplitRNN"
2
+ audio:
3
+ chunk_size: 264600
4
+ num_channels: 2
5
+ sample_rate: 44100
6
+ min_mean_abs: 0.001
7
+
8
+ model:
9
+ in_channel: 1
10
+ stems: ['speech', 'music', 'effects']
11
+ band_specs: "musical"
12
+ n_bands: 64
13
+ fs: 44100
14
+ require_no_overlap: false
15
+ require_no_gap: true
16
+ normalize_channel_independently: false
17
+ treat_channel_as_feature: true
18
+ n_sqm_modules: 8
19
+ emb_dim: 128
20
+ rnn_dim: 256
21
+ bidirectional: true
22
+ rnn_type: "GRU"
23
+ mlp_dim: 512
24
+ hidden_activation: "Tanh"
25
+ hidden_activation_kwargs: null
26
+ complex_mask: true
27
+ n_fft: 2048
28
+ win_length: 2048
29
+ hop_length: 512
30
+ window_fn: "hann_window"
31
+ wkwargs: null
32
+ power: null
33
+ center: true
34
+ normalized: true
35
+ pad_mode: "constant"
36
+ onesided: true
37
+
38
+ training:
39
+ batch_size: 4
40
+ gradient_accumulation_steps: 4
41
+ grad_clip: 0
42
+ instruments:
43
+ - Speech
44
+ - Music
45
+ - Effects
46
+ lr: 9.0e-05
47
+ patience: 2
48
+ reduce_factor: 0.95
49
+ target_instrument: null
50
+ num_epochs: 1000
51
+ num_steps: 1000
52
+ q: 0.95
53
+ coarse_loss_clip: true
54
+ ema_momentum: 0.999
55
+ optimizer: adam
56
+ other_fix: true # it's needed for checking on multisong dataset if other is actually instrumental
57
+ use_amp: true # enable or disable usage of mixed precision (float16) - usually it must be true
58
+
59
+ augmentations:
60
+ enable: true # enable or disable all augmentations (a quick way to turn them all off if needed)
61
+ loudness: true # randomly change loudness of each stem on the range (loudness_min; loudness_max)
62
+ loudness_min: 0.5
63
+ loudness_max: 1.5
64
+ mixup: true # mix several stems of same type with some probability (only works for dataset types: 1, 2, 3)
65
+ mixup_probs: !!python/tuple # 2 additional stems of the same type (1st with prob 0.2, 2nd with prob 0.02)
66
+ - 0.2
67
+ - 0.02
68
+ mixup_loudness_min: 0.5
69
+ mixup_loudness_max: 1.5
70
+ all:
71
+ channel_shuffle: 0.5 # Set 0 or lower to disable
72
+ random_inverse: 0.1 # inverse track (better lower probability)
73
+ random_polarity: 0.5 # polarity change (multiply waveform by -1)
74
+
75
+ inference:
76
+ batch_size: 1
77
+ dim_t: 256
78
+ num_overlap: 4
Bandit_models/config_dnr_bandit_v2_mus64.yaml ADDED
@@ -0,0 +1,78 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ cls: Bandit
2
+
3
+ audio:
4
+ chunk_size: 384000
5
+ num_channels: 2
6
+ sample_rate: 48000
7
+ min_mean_abs: 0.000
8
+
9
+ kwargs:
10
+ in_channels: 1
11
+ stems: ['speech', 'music', 'sfx']
12
+ band_type: musical
13
+ n_bands: 64
14
+ normalize_channel_independently: false
15
+ treat_channel_as_feature: true
16
+ n_sqm_modules: 8
17
+ emb_dim: 128
18
+ rnn_dim: 256
19
+ bidirectional: true
20
+ rnn_type: "GRU"
21
+ mlp_dim: 512
22
+ hidden_activation: "Tanh"
23
+ hidden_activation_kwargs:
24
+ complex_mask: true
25
+ use_freq_weights: true
26
+ n_fft: 2048
27
+ win_length: 2048
28
+ hop_length: 512
29
+ window_fn: "hann_window"
30
+ wkwargs:
31
+ power:
32
+ center: true
33
+ normalized: true
34
+ pad_mode: "reflect"
35
+ onesided: true
36
+
37
+ training:
38
+ batch_size: 4
39
+ gradient_accumulation_steps: 4
40
+ grad_clip: 0
41
+ instruments:
42
+ - Speech
43
+ - Music
44
+ - Sfx
45
+ lr: 9.0e-05
46
+ patience: 2
47
+ reduce_factor: 0.95
48
+ target_instrument:
49
+ num_epochs: 1000
50
+ num_steps: 1000
51
+ q: 0.95
52
+ coarse_loss_clip: true
53
+ ema_momentum: 0.999
54
+ optimizer: adam
55
+ other_fix: true # it's needed for checking on multisong dataset if other is actually instrumental
56
+ use_amp: true # enable or disable usage of mixed precision (float16) - usually it must be true
57
+
58
+ augmentations:
59
+ enable: true # enable or disable all augmentations (a quick way to turn them all off if needed)
60
+ loudness: true # randomly change loudness of each stem on the range (loudness_min; loudness_max)
61
+ loudness_min: 0.5
62
+ loudness_max: 1.5
63
+ mixup: true # mix several stems of same type with some probability (only works for dataset types: 1, 2, 3)
64
+ mixup_probs: !!python/tuple
65
+ # 2 additional stems of the same type (1st with prob 0.2, 2nd with prob 0.02)
66
+ - 0.2
67
+ - 0.02
68
+ mixup_loudness_min: 0.5
69
+ mixup_loudness_max: 1.5
70
+ all:
71
+ channel_shuffle: 0.5 # Set 0 or lower to disable
72
+ random_inverse: 0.1 # inverse track (better lower probability)
73
+ random_polarity: 0.5 # polarity change (multiply waveform by -1)
74
+
75
+ inference:
76
+ batch_size: 8
77
+ dim_t: 256
78
+ num_overlap: 4
Bandit_models/model_bandit_plus_dnr_sdr_11.47.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c48284779f7d1258a6527d3aaa18a532d45c1f506e2dcc25d5ab179a8c5e2573
3
+ size 148891175
MDX23C_models/MDX23C-8KFFT-InstVoc_HQ.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:49d51472769e34a2501cd1da782346a3212555c3a5619fc2c53507445528d816
3
+ size 448101203
MDX23C_models/MDX23C-8KFFT-InstVoc_HQ_2.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d960d8e40a458120412c1bd807e013d2dbca7b959cc9da2bbcb0eb203d1daea
3
+ size 448093770
MDX23C_models/MDX23C-De-Reverb-aufr33-jarredou.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eae2471b707758d74db38ac1b1d5800e12f57c4e9d1ebbb2faf004b8e086e914
3
+ size 448098867
MDX23C_models/MDX23C-DrumSep-aufr33-jarredou.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d2a4aa53eb584d21eead358a4e66d1882ad182911be018f052b5da73be9096d0
3
+ size 437652699
MDX23C_models/MDX23C_D1581.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d7d4d2137f12764950205b095da20032fef1d41f077bacc8582f20ed40e8cb28
3
+ size 183379219
MDX23C_models/config_dereverb_mdx23c.yaml ADDED
@@ -0,0 +1,135 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ audio:
2
+ chunk_size: 261120
3
+ dim_f: 4096
4
+ dim_t: 256
5
+ hop_length: 1024
6
+ n_fft: 8192
7
+ num_channels: 2
8
+ sample_rate: 44100
9
+ min_mean_abs: 0.001
10
+
11
+ model:
12
+ act: gelu
13
+ bottleneck_factor: 4
14
+ growth: 128
15
+ norm: InstanceNorm
16
+ num_blocks_per_scale: 2
17
+ num_channels: 128
18
+ num_scales: 5
19
+ num_subbands: 4
20
+ scale:
21
+ - 2
22
+ - 2
23
+
24
+ training:
25
+ batch_size: 2
26
+ gradient_accumulation_steps: 1
27
+ grad_clip: 0
28
+ instruments:
29
+ - dry
30
+ - No dry
31
+ lr: 1.0e-06
32
+ patience: 4
33
+ reduce_factor: 0.93
34
+ target_instrument: null
35
+ num_epochs: 40
36
+ num_steps: 1000
37
+ q: 0.95
38
+ coarse_loss_clip: true
39
+ ema_momentum: 0.999
40
+ optimizer: adamw
41
+ read_metadata_procs: 8 # Number of processes to use during metadata reading for dataset. Can speed up metadata generation
42
+ other_fix: false # it's needed for checking on multisong dataset if other is actually instrumental
43
+ use_amp: true # enable or disable usage of mixed precision (float16) - usually it must be true
44
+
45
+ augmentations:
46
+ enable: false # enable or disable all augmentations (a quick way to turn them all off if needed)
47
+ loudness: true # randomly change loudness of each stem on the range (loudness_min; loudness_max)
48
+ loudness_min: 0.5
49
+ loudness_max: 1.5
50
+ mixup: true # mix several stems of same type with some probability (only works for dataset types: 1, 2, 3)
51
+ mixup_probs: !!python/tuple # 2 additional stems of the same type (1st with prob 0.2, 2nd with prob 0.02)
52
+ - 0.2
53
+ - 0.02
54
+ mixup_loudness_min: 0.5
55
+ mixup_loudness_max: 1.5
56
+
57
+ all:
58
+ channel_shuffle: 0.5 # Set 0 or lower to disable
59
+ random_inverse: 0.05 # inverse track (better lower probability)
60
+ random_polarity: 0.5 # polarity change (multiply waveform by -1)
61
+
62
+ # pedalboard chorus block
63
+ pedalboard_chorus: 0.001
64
+ pedalboard_chorus_rate_hz_min: 1.0
65
+ pedalboard_chorus_rate_hz_max: 7.0
66
+ pedalboard_chorus_depth_min: 0.25
67
+ pedalboard_chorus_depth_max: 0.95
68
+ pedalboard_chorus_centre_delay_ms_min: 3
69
+ pedalboard_chorus_centre_delay_ms_max: 10
70
+ pedalboard_chorus_feedback_min: 0.0
71
+ pedalboard_chorus_feedback_max: 0.01
72
+ pedalboard_chorus_mix_min: 0.1
73
+ pedalboard_chorus_mix_max: 0.9
74
+
75
+ # pedalboard phazer block
76
+ pedalboard_phazer: 0.001
77
+ pedalboard_phazer_rate_hz_min: 1.0
78
+ pedalboard_phazer_rate_hz_max: 10.0
79
+ pedalboard_phazer_depth_min: 0.25
80
+ pedalboard_phazer_depth_max: 0.95
81
+ pedalboard_phazer_centre_frequency_hz_min: 200
82
+ pedalboard_phazer_centre_frequency_hz_max: 12000
83
+ pedalboard_phazer_feedback_min: 0.0
84
+ pedalboard_phazer_feedback_max: 0.5
85
+ pedalboard_phazer_mix_min: 0.1
86
+ pedalboard_phazer_mix_max: 0.9
87
+
88
+ # pedalboard pitch shift block
89
+ pedalboard_pitch_shift: 0.01
90
+ pedalboard_pitch_shift_semitones_min: -7
91
+ pedalboard_pitch_shift_semitones_max: 7
92
+
93
+ # pedalboard resample block
94
+ pedalboard_resample: 0.001
95
+ pedalboard_resample_target_sample_rate_min: 4000
96
+ pedalboard_resample_target_sample_rate_max: 44100
97
+
98
+ mp3_compression_min_bitrate: 32
99
+ mp3_compression_max_bitrate: 320
100
+ mp3_compression_backend: "lameenc"
101
+
102
+ dry:
103
+ # pedalboard distortion block
104
+ pedalboard_distortion: 0.001
105
+ pedalboard_distortion_drive_db_min: 1.0
106
+ pedalboard_distortion_drive_db_max: 25.0
107
+
108
+ tanh_distortion: 0.05
109
+ tanh_distortion_min: 0.1
110
+ tanh_distortion_max: 0.7
111
+ # pedalboard bitcrash block
112
+ pedalboard_bitcrash: 0.005
113
+ pedalboard_bitcrash_bit_depth_min: 4
114
+ pedalboard_bitcrash_bit_depth_max: 16
115
+
116
+ seven_band_parametric_eq: 0.24
117
+ seven_band_parametric_eq_min_gain_db: -9
118
+ seven_band_parametric_eq_max_gain_db: 9
119
+
120
+ gaussian_noise: 0.005
121
+ gaussian_noise_min_amplitude: 0.001
122
+ gaussian_noise_max_amplitude: 0.01
123
+
124
+ time_stretch: 0.01
125
+ time_stretch_min_rate: 0.8
126
+ time_stretch_max_rate: 1.25
127
+ other:
128
+ seven_band_parametric_eq: 0.24
129
+ seven_band_parametric_eq_min_gain_db: -9
130
+ seven_band_parametric_eq_max_gain_db: 9
131
+
132
+ inference:
133
+ batch_size: 2
134
+ dim_t: 256
135
+ num_overlap: 4
MDX23C_models/config_drumsep_mdx23c.yaml ADDED
@@ -0,0 +1,87 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ audio:
2
+ chunk_size: 130560
3
+ dim_f: 1024
4
+ dim_t: 256
5
+ hop_length: 512
6
+ n_fft: 2048
7
+ num_channels: 2
8
+ sample_rate: 44100
9
+ min_mean_abs: 0.001
10
+
11
+ model:
12
+ act: gelu
13
+ bottleneck_factor: 4
14
+ growth: 128
15
+ norm: InstanceNorm
16
+ num_blocks_per_scale: 2
17
+ num_channels: 128
18
+ num_scales: 5
19
+ num_subbands: 4
20
+ scale:
21
+ - 2
22
+ - 2
23
+
24
+ training:
25
+ batch_size: 12
26
+ gradient_accumulation_steps: 1
27
+ grad_clip: 0
28
+ instruments:
29
+ - kick
30
+ - snare
31
+ - toms
32
+ - hh
33
+ - ride
34
+ - crash
35
+ lr: 9.0e-05
36
+ patience: 30
37
+ reduce_factor: 0.95
38
+ target_instrument: null
39
+ num_epochs: 1000
40
+ num_steps: 1268
41
+ q: 0.95
42
+ coarse_loss_clip: true
43
+ ema_momentum: 0.999
44
+ optimizer: adam
45
+ other_fix: false # it's needed for checking on multisong dataset if other is actually instrumental
46
+ use_amp: true # enable or disable usage of mixed precision (float16) - usually it must be true
47
+
48
+ augmentations:
49
+ enable: true # enable or disable all augmentations (a quick way to turn them all off if needed)
50
+ loudness: true # randomly change loudness of each stem on the range (loudness_min; loudness_max)
51
+ loudness_min: 0.5
52
+ loudness_max: 1.5
53
+ mixup: true # mix several stems of same type with some probability (only works for dataset types: 1, 2, 3)
54
+ mixup_probs: !!python/tuple # 2 additional stems of the same type (1st with prob 0.2, 2nd with prob 0.02)
55
+ - 0.2
56
+ - 0.02
57
+ mixup_loudness_min: 0.5
58
+ mixup_loudness_max: 1.5
59
+
60
+ # apply mp3 compression to mixture only (emulate downloading mp3 from internet)
61
+ mp3_compression_on_mixture: 0.0
62
+ mp3_compression_on_mixture_bitrate_min: 32
63
+ mp3_compression_on_mixture_bitrate_max: 320
64
+ mp3_compression_on_mixture_backend: "lameenc"
65
+
66
+ all:
67
+ channel_shuffle: 0.5 # Set 0 or lower to disable
68
+ random_inverse: 0.01 # inverse track (better lower probability)
69
+ random_polarity: 0.5 # polarity change (multiply waveform by -1)
70
+ mp3_compression: 0.0
71
+ mp3_compression_min_bitrate: 32
72
+ mp3_compression_max_bitrate: 320
73
+ mp3_compression_backend: "lameenc"
74
+ pitch_shift: 0.1
75
+ pitch_shift_min_semitones: -3
76
+ pitch_shift_max_semitones: 3
77
+ seven_band_parametric_eq: 0.5
78
+ seven_band_parametric_eq_min_gain_db: -6
79
+ seven_band_parametric_eq_max_gain_db: 6
80
+ tanh_distortion: 0.2
81
+ tanh_distortion_min: 0.1
82
+ tanh_distortion_max: 0.5
83
+
84
+ inference:
85
+ batch_size: 1
86
+ dim_t: 256
87
+ num_overlap: 4
MDX23C_models/config_mdx23c_similarity.yaml ADDED
@@ -0,0 +1,47 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ audio:
2
+ chunk_size: 130560
3
+ dim_f: 1024
4
+ dim_t: 256
5
+ hop_length: 512
6
+ n_fft: 2048
7
+ num_channels: 2
8
+ sample_rate: 44100
9
+ min_mean_abs: 0.001
10
+
11
+ model:
12
+ act: gelu
13
+ bottleneck_factor: 4
14
+ growth: 128
15
+ norm: InstanceNorm
16
+ num_blocks_per_scale: 2
17
+ num_channels: 128
18
+ num_scales: 5
19
+ num_subbands: 4
20
+ scale:
21
+ - 2
22
+ - 2
23
+
24
+ training:
25
+ batch_size: 2
26
+ gradient_accumulation_steps: 3
27
+ grad_clip: 0
28
+ instruments:
29
+ - Similarity
30
+ - Difference
31
+ lr: 1.0
32
+ patience: 15
33
+ reduce_factor: 0.95
34
+ target_instrument: Similarity
35
+ num_epochs: 1000
36
+ num_steps: 2235
37
+ q: 0.95
38
+ coarse_loss_clip: true
39
+ ema_momentum: 0.999
40
+ optimizer: prodigy
41
+ other_fix: false # it's needed for checking on multisong dataset if other is actually instrumental
42
+ use_amp: true # enable or disable usage of mixed precision (float16) - usually it must be true
43
+
44
+ inference:
45
+ batch_size: 8
46
+ dim_t: 256
47
+ num_overlap: 8
MDX23C_models/model_2_stem_061321.yaml ADDED
@@ -0,0 +1,36 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ audio:
2
+ chunk_size: 260096
3
+ dim_f: 4096
4
+ dim_t: 256
5
+ hop_length: 2048
6
+ n_fft: 12288
7
+ num_channels: 2
8
+ sample_rate: 44100
9
+ min_mean_abs: 0.001
10
+ model:
11
+ act: gelu
12
+ bottleneck_factor: 4
13
+ growth: 64
14
+ norm: InstanceNorm
15
+ num_blocks_per_scale: 2
16
+ num_channels: 128
17
+ num_scales: 5
18
+ num_subbands: 4
19
+ scale:
20
+ - 2
21
+ - 2
22
+ name: epoch_10.ckpt
23
+ training:
24
+ batch_size: 16
25
+ grad_clip: 0
26
+ instruments:
27
+ - Vocals
28
+ - Instrumental
29
+ lr: 5.0e-05
30
+ target_instrument: null
31
+ num_epochs: 100
32
+ num_steps: 1000
33
+ inference:
34
+ batch_size: 1
35
+ dim_t: 256
36
+ num_overlap: 8
MDX23C_models/model_2_stem_full_band_8k.yaml ADDED
@@ -0,0 +1,43 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ audio:
2
+ chunk_size: 261120
3
+ dim_f: 4096
4
+ dim_t: 256
5
+ hop_length: 1024
6
+ n_fft: 8192
7
+ num_channels: 2
8
+ sample_rate: 44100
9
+ min_mean_abs: 0.001
10
+ model:
11
+ act: gelu
12
+ bottleneck_factor: 4
13
+ growth: 128
14
+ norm: InstanceNorm
15
+ num_blocks_per_scale: 2
16
+ num_channels: 128
17
+ num_scales: 5
18
+ num_subbands: 4
19
+ scale:
20
+ - 2
21
+ - 2
22
+ training:
23
+ batch_size: 6
24
+ grad_clip: 0
25
+ instruments:
26
+ - Vocals
27
+ - Instrumental
28
+ lr: 1.0e-05
29
+ patience: 2
30
+ reduce_factor: 0.95
31
+ target_instrument: null
32
+ num_epochs: 1000
33
+ num_steps: 1000
34
+ augmentation: 1
35
+ augmentation_type: simple1
36
+ augmentation_mix: true
37
+ q: 0.95
38
+ coarse_loss_clip: true
39
+ ema_momentum: 0.999
40
+ inference:
41
+ batch_size: 1
42
+ dim_t: 256
43
+ num_overlap: 8
MDX23C_models/model_mdx23c_ep_271_l1_freq_72.2383.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1227f8d97c7436004d03e46091427393abefebcc08ce53ef30082742c4e482f7
3
+ size 437613512
MDXNet_models/Kim_Inst.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:86b1940e7122fbdd2beadc65507cbff6c352d79012a8a7e60d56db98532af5f7
3
+ size 66759214
MDXNet_models/Kim_Vocal_1.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f313140ef8fecc3041881b60ecb993d985a0281a138b2fb634aa8901aebc38cb
3
+ size 66759214
MDXNet_models/Kim_Vocal_2.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ce74ef3b6a6024ce44211a07be9cf8bc6d87728cc852a68ab34eb8e58cde9c8b
3
+ size 66759214
MDXNet_models/Reverb_HQ_By_FoxJoy.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:233bb5c6aaa365e568659a0a81211746fa881f8f47f82d9e864fce1f7692db80
3
+ size 66780123
MDXNet_models/UVR-MDX-NET-Inst_1.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ca53f94b7a0cbb04fcfcc8f3ea5ec1ae22cd8ad044f5e673588859f83976f5e
3
+ size 66759214
MDXNet_models/UVR-MDX-NET-Inst_2.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3a96a664d28b52db9def0a9cae9a16dbb524d8325bfe8f0ac64ac5d231456bc
3
+ size 66759214
MDXNet_models/UVR-MDX-NET-Inst_3.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b7834e2972158d8c9864e7376e3a7d084079c80a23f38dc31c4b0a4e901a1cb
3
+ size 66759214
MDXNet_models/UVR-MDX-NET-Inst_HQ_1.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:38a045c4ded87e3bf97b609ec5be7910e8a7cecec455f507227ab12b5e29f7f9
3
+ size 66759214
MDXNet_models/UVR-MDX-NET-Inst_HQ_2.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:197f8ab296df850f961e68c595f6649acb7d9e621b5600b460f3458967299112
3
+ size 66759214
MDXNet_models/UVR-MDX-NET-Inst_HQ_3.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:317554b07fe1ea5279a77f2b1520a41ea4b93432560c4ffd08792c30fddf9adc
3
+ size 66759214
MDXNet_models/UVR-MDX-NET-Inst_HQ_4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c4b5b9b05090fdf238f38ba5046813982d50e2a652e9cb3324ea79720c3c9c8
3
+ size 59074342
MDXNet_models/UVR-MDX-NET-Inst_HQ_5.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:811cb24095d865763752310848b7ec86aeede0626cb05749ab35350e46897000
3
+ size 59074342
MDXNet_models/UVR-MDX-NET-Inst_Main.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ab401dfe4a548b87deb64f975294bd56ff946aa32903f53b4b24bb13b2cce1e
3
+ size 52786726
MDXNet_models/UVR-MDX-NET-Inst_full_292.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:020f6b65fa219fb7c285e4f3fc2863bf22daf03c4c93e547b6d13d5f2757a7ec
3
+ size 66759214
MDXNet_models/UVR-MDX-NET-Voc_FT.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:534b2070fcc7df514b13ef660dc8cbb328679c2374d04354a5c42bb14ecce111
3
+ size 66762490
MDXNet_models/UVR-MDX-NET_Crowd_HQ_1.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:313b7bf869c411fdafe005cf0d5a635c405cb3d0df137178a64091952d75225c
3
+ size 59074342
MDXNet_models/UVR-MDX-NET_Inst_187_beta.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c74566f3c3033cacba996328b2ee90bf77ef79ea6c35b7841df183b7906f54a5
3
+ size 66759214
MDXNet_models/UVR-MDX-NET_Inst_82_beta.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c6c268302f09ab53687072618e056a611272a7e2c3fd9b3b59164da152f3588e
3
+ size 66759214
MDXNet_models/UVR-MDX-NET_Inst_90_beta.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d902868a46575aea6ee2335736ff3b53faf497a6bdaa1b864e0fd84eb1b42a5
3
+ size 66759214
MDXNet_models/UVR-MDX-NET_Main_340.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:78792633b4007755af12ecde20f709b4f0b99563b1d25fe0a501ed2122aff218
3
+ size 66759214
MDXNet_models/UVR-MDX-NET_Main_390.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:286c4f0847ca837e2c3f4c4058f756d5f150cbf080506aa6f33a2847aba92e8c
3
+ size 66759214
MDXNet_models/UVR-MDX-NET_Main_406.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f158816a44eef1f0ba0f48b813cbfcf460ed1c70a754af3609ade44aaf7d1b23
3
+ size 66759214
MDXNet_models/UVR-MDX-NET_Main_427.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:95275802a27801b97e3c0552b6eaa69f9bb3bd7df53cdf0536cce0a753f702cc
3
+ size 66759214
MDXNet_models/UVR-MDX-NET_Main_438.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5e1ad93587a163a0987a0168b99a2ad875c0d9bfc3afb596b7c36b09c7f5c26
3
+ size 66759214
MDXNet_models/UVR_MDXNET_1_9703.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:229ad3bb96a037e89d8ed86732d6d3675856e6a07c3e3f02896eac01ec7ee4be
3
+ size 29704436
MDXNet_models/UVR_MDXNET_2_9682.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1deb7295acd3206bc9582a5d92f1b0a74bf3f41c7c1fb78a0ac0123cde4372db
3
+ size 29704436
MDXNet_models/UVR_MDXNET_3_9662.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e02220e80d8253f4c2209f8924298b2b686bbdf2868b788ff5500fb9bd94aadc
3
+ size 29704436
MDXNet_models/UVR_MDXNET_9482.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f4f365207c56deb115bceedff3ad8fe98a751c745f9e370cecec6226b8b47184
3
+ size 29704436
MDXNet_models/UVR_MDXNET_KARA.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3167c87333a48548413e972a286bf40bf5694001d2853861eb1435953f02d63
3
+ size 29704436
MDXNet_models/UVR_MDXNET_KARA_2.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf32e15105a09c0f7dddd2b67346146334d6f3ecb399ed7638eba2ab07cbf5f4
3
+ size 52786726
MDXNet_models/UVR_MDXNET_Main.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8289784cda38543ff431add4070662813311a8cccfc0112ca82f76d9dba2b4ca
3
+ size 66759214
MDXNet_models/kuielab_a_bass.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c3e77b9963185b1ea6bb46a4b8924137d9370fc1ccdefec7b1b416ef550dcaa
3
+ size 29703204
MDXNet_models/kuielab_a_drums.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:40f586b7091934dd6f5563f0cba8f14bad57ce88440da1098bf388ea716c2901
3
+ size 29703204
MDXNet_models/kuielab_a_other.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b67a1dcb5f232153528c59960b4c7bf8dc736b8114de360af0e719633f53358
3
+ size 29703204
MDXNet_models/kuielab_a_vocals.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:daba83c2ee1afee9139766ad64c9b6808d6b6f092fff04bed3338be50baac721
3
+ size 29703204