QQSong committed on
Commit
bf1ab5f
·
verified ·
1 Parent(s): 044a0ea

Upload 14 files

Browse files
MDX_Net_Models/model_data/mdx_c_configs/model1.yaml ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ audio:
2
+ chunk_size: 260096
3
+ dim_f: 4096
4
+ dim_t: 128
5
+ hop_length: 2048
6
+ n_fft: 8192
7
+ num_channels: 2
8
+ sample_rate: 44100
9
+ model:
10
+ act: gelu
11
+ bottleneck_factor: 4
12
+ growth: 64
13
+ norm: InstanceNorm
14
+ num_blocks_per_scale: 2
15
+ num_channels: 128
16
+ num_scales: 5
17
+ num_subbands: 4
18
+ scale:
19
+ - 2
20
+ - 2
21
+ training:
22
+ batch_size: 8
23
+ grad_clip: 0
24
+ instruments:
25
+ - Vocals
26
+ - Drums
27
+ - Bass
28
+ - Other
29
+ lr: 5.0e-05
30
+ target_instrument: null
31
+ inference:
32
+ batch_size: 1
33
+ dim_t: 256
34
+ num_overlap: 8
MDX_Net_Models/model_data/mdx_c_configs/model2.yaml ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ audio:
2
+ chunk_size: 260096
3
+ dim_f: 4096
4
+ dim_t: 128
5
+ hop_length: 2048
6
+ n_fft: 8192
7
+ num_channels: 2
8
+ sample_rate: 44100
9
+ model:
10
+ act: gelu
11
+ bottleneck_factor: 4
12
+ growth: 64
13
+ norm: InstanceNorm
14
+ num_blocks_per_scale: 2
15
+ num_channels: 256
16
+ num_scales: 5
17
+ num_subbands: 4
18
+ scale:
19
+ - 2
20
+ - 2
21
+ training:
22
+ batch_size: 8
23
+ grad_clip: 0
24
+ instruments:
25
+ - Vocals
26
+ - Drums
27
+ - Bass
28
+ - Other
29
+ lr: 3.0e-05
30
+ target_instrument: null
31
+ inference:
32
+ batch_size: 1
33
+ dim_t: 256
34
+ num_overlap: 8
MDX_Net_Models/model_data/mdx_c_configs/model3.yaml ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ audio:
2
+ chunk_size: 260096
3
+ dim_f: 4096
4
+ dim_t: 128
5
+ hop_length: 2048
6
+ n_fft: 12288
7
+ num_channels: 2
8
+ sample_rate: 44100
9
+ model:
10
+ act: gelu
11
+ bottleneck_factor: 4
12
+ growth: 64
13
+ norm: InstanceNorm
14
+ num_blocks_per_scale: 2
15
+ num_channels: 128
16
+ num_scales: 5
17
+ num_subbands: 4
18
+ scale:
19
+ - 2
20
+ - 2
21
+ training:
22
+ batch_size: 8
23
+ grad_clip: 0
24
+ instruments:
25
+ - Vocals
26
+ - Drums
27
+ - Bass
28
+ - Other
29
+ lr: 5.0e-05
30
+ target_instrument: Vocals
31
+ inference:
32
+ batch_size: 1
33
+ dim_t: 256
34
+ num_overlap: 8
MDX_Net_Models/model_data/mdx_c_configs/modelA.yaml ADDED
@@ -0,0 +1,39 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ audio:
2
+ chunk_size: 261120
3
+ dim_f: 4096
4
+ dim_t: 256
5
+ hop_length: 1024
6
+ min_mean_abs: 0.01
7
+ n_fft: 8192
8
+ num_channels: 2
9
+ sample_rate: 44100
10
+ model:
11
+ act: gelu
12
+ bottleneck_factor: 4
13
+ growth: 64
14
+ norm: InstanceNorm
15
+ num_blocks_per_scale: 2
16
+ num_channels: 64
17
+ num_scales: 5
18
+ num_subbands: 4
19
+ scale:
20
+ - 2
21
+ - 2
22
+ training:
23
+ batch_size: 6
24
+ coarse_loss_clip: true
25
+ ema_momentum: 0.999
26
+ grad_clip: null
27
+ instruments:
28
+ - Vocals
29
+ - Drums
30
+ - Bass
31
+ - Other
32
+ lr: 0.0001
33
+ num_steps: 100000
34
+ q: 0.4
35
+ target_instrument: null
36
+ inference:
37
+ batch_size: 2
38
+ dim_t: 256
39
+ num_overlap: 8
MDX_Net_Models/model_data/mdx_c_configs/modelB.yaml ADDED
@@ -0,0 +1,41 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ audio:
2
+ chunk_size: 261120
3
+ dim_f: 4096
4
+ dim_t: 256
5
+ hop_length: 1024
6
+ min_mean_abs: 0.01
7
+ n_fft: 8192
8
+ num_channels: 2
9
+ sample_rate: 44100
10
+ model:
11
+ act: gelu
12
+ bottleneck_factor: 4
13
+ growth: 64
14
+ norm: InstanceNorm
15
+ num_blocks_per_scale: 2
16
+ num_channels: 64
17
+ num_scales: 5
18
+ num_subbands: 4
19
+ scale:
20
+ - 2
21
+ - 2
22
+ training:
23
+ batch_size: 6
24
+ coarse_loss_clip: false
25
+ datasets:
26
+ - ../data/moises/bleeding
27
+ ema_momentum: 0.999
28
+ grad_clip: null
29
+ instruments:
30
+ - Vocals
31
+ - Drums
32
+ - Bass
33
+ - Other
34
+ lr: 0.0001
35
+ num_steps: 150000
36
+ q: 0.93
37
+ target_instrument: null
38
+ inference:
39
+ batch_size: 2
40
+ dim_t: 256
41
+ num_overlap: 8
MDX_Net_Models/model_data/mdx_c_configs/model_2_stem_061321.yaml ADDED
@@ -0,0 +1,36 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ audio:
2
+ chunk_size: 260096
3
+ dim_f: 4096
4
+ dim_t: 256
5
+ hop_length: 2048
6
+ n_fft: 12288
7
+ num_channels: 2
8
+ sample_rate: 44100
9
+ min_mean_abs: 0.001
10
+ model:
11
+ act: gelu
12
+ bottleneck_factor: 4
13
+ growth: 64
14
+ norm: InstanceNorm
15
+ num_blocks_per_scale: 2
16
+ num_channels: 128
17
+ num_scales: 5
18
+ num_subbands: 4
19
+ scale:
20
+ - 2
21
+ - 2
22
+ name: epoch_10.ckpt
23
+ training:
24
+ batch_size: 16
25
+ grad_clip: 0
26
+ instruments:
27
+ - Vocals
28
+ - Instrumental
29
+ lr: 5.0e-05
30
+ target_instrument: null
31
+ num_epochs: 100
32
+ num_steps: 1000
33
+ inference:
34
+ batch_size: 1
35
+ dim_t: 256
36
+ num_overlap: 8
MDX_Net_Models/model_data/mdx_c_configs/model_2_stem_full_band.yaml ADDED
@@ -0,0 +1,36 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ audio:
2
+ chunk_size: 260096
3
+ dim_f: 6144
4
+ dim_t: 128
5
+ hop_length: 2048
6
+ n_fft: 12288
7
+ num_channels: 2
8
+ sample_rate: 44100
9
+ min_mean_abs: 0.001
10
+ model:
11
+ act: gelu
12
+ bottleneck_factor: 4
13
+ growth: 64
14
+ norm: InstanceNorm
15
+ num_blocks_per_scale: 2
16
+ num_channels: 128
17
+ num_scales: 5
18
+ num_subbands: 6
19
+ scale:
20
+ - 2
21
+ - 2
22
+ training:
23
+ batch_size: 14
24
+ grad_clip: 0
25
+ instruments:
26
+ - Vocals
27
+ - Instrumental
28
+ lr: 3.0e-05
29
+ target_instrument: null
30
+ num_epochs: 1000
31
+ num_steps: 1000
32
+ augmentation: 1
33
+ inference:
34
+ batch_size: 1
35
+ dim_t: 256
36
+ num_overlap: 8
MDX_Net_Models/model_data/mdx_c_configs/model_2_stem_full_band_2.yaml ADDED
@@ -0,0 +1,36 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ audio:
2
+ chunk_size: 260096
3
+ dim_f: 6144
4
+ dim_t: 128
5
+ hop_length: 2048
6
+ n_fft: 12288
7
+ num_channels: 2
8
+ sample_rate: 44100
9
+ min_mean_abs: 0.001
10
+ model:
11
+ act: gelu
12
+ bottleneck_factor: 4
13
+ growth: 128
14
+ norm: InstanceNorm
15
+ num_blocks_per_scale: 2
16
+ num_channels: 128
17
+ num_scales: 5
18
+ num_subbands: 6
19
+ scale:
20
+ - 2
21
+ - 2
22
+ training:
23
+ batch_size: 14
24
+ grad_clip: 0
25
+ instruments:
26
+ - Vocals
27
+ - Instrumental
28
+ lr: 2.0e-05
29
+ target_instrument: null
30
+ num_epochs: 1000
31
+ num_steps: 1000
32
+ augmentation: 1
33
+ inference:
34
+ batch_size: 1
35
+ dim_t: 256
36
+ num_overlap: 8
MDX_Net_Models/model_data/mdx_c_configs/model_2_stem_full_band_3.yaml ADDED
@@ -0,0 +1,39 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ audio:
2
+ chunk_size: 261120
3
+ dim_f: 6144
4
+ dim_t: 256
5
+ hop_length: 1024
6
+ n_fft: 12288
7
+ num_channels: 2
8
+ sample_rate: 44100
9
+ min_mean_abs: 0.001
10
+ model:
11
+ act: gelu
12
+ bottleneck_factor: 4
13
+ growth: 128
14
+ norm: InstanceNorm
15
+ num_blocks_per_scale: 2
16
+ num_channels: 128
17
+ num_scales: 5
18
+ num_subbands: 6
19
+ scale:
20
+ - 2
21
+ - 2
22
+ training:
23
+ batch_size: 6
24
+ grad_clip: 0
25
+ instruments:
26
+ - Vocals
27
+ - Instrumental
28
+ lr: 1.0e-05
29
+ target_instrument: null
30
+ num_epochs: 1000
31
+ num_steps: 1000
32
+ augmentation: 1
33
+ q: 0.95
34
+ coarse_loss_clip: true
35
+ ema_momentum: 0.999
36
+ inference:
37
+ batch_size: 1
38
+ dim_t: 256
39
+ num_overlap: 8
MDX_Net_Models/model_data/mdx_c_configs/model_2_stem_full_band_4.yaml ADDED
@@ -0,0 +1,40 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ audio:
2
+ chunk_size: 261120
3
+ dim_f: 6144
4
+ dim_t: 256
5
+ hop_length: 1024
6
+ n_fft: 12288
7
+ num_channels: 2
8
+ sample_rate: 44100
9
+ min_mean_abs: 0.001
10
+ model:
11
+ act: gelu
12
+ bottleneck_factor: 4
13
+ growth: 128
14
+ norm: InstanceNorm
15
+ num_blocks_per_scale: 2
16
+ num_channels: 128
17
+ num_scales: 5
18
+ num_subbands: 6
19
+ scale:
20
+ - 2
21
+ - 2
22
+ training:
23
+ batch_size: 6
24
+ grad_clip: 0
25
+ instruments:
26
+ - Vocals
27
+ - Instrumental
28
+ lr: 0.7e-05
29
+ patience: 2
30
+ target_instrument: null
31
+ num_epochs: 1000
32
+ num_steps: 1000
33
+ augmentation: 1
34
+ q: 0.95
35
+ coarse_loss_clip: true
36
+ ema_momentum: 0.999
37
+ inference:
38
+ batch_size: 1
39
+ dim_t: 256
40
+ num_overlap: 8
MDX_Net_Models/model_data/mdx_c_configs/model_2_stem_full_band_8k.yaml ADDED
@@ -0,0 +1,43 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ audio:
2
+ chunk_size: 261120
3
+ dim_f: 4096
4
+ dim_t: 256
5
+ hop_length: 1024
6
+ n_fft: 8192
7
+ num_channels: 2
8
+ sample_rate: 44100
9
+ min_mean_abs: 0.001
10
+ model:
11
+ act: gelu
12
+ bottleneck_factor: 4
13
+ growth: 128
14
+ norm: InstanceNorm
15
+ num_blocks_per_scale: 2
16
+ num_channels: 128
17
+ num_scales: 5
18
+ num_subbands: 4
19
+ scale:
20
+ - 2
21
+ - 2
22
+ training:
23
+ batch_size: 6
24
+ grad_clip: 0
25
+ instruments:
26
+ - Vocals
27
+ - Instrumental
28
+ lr: 1.0e-05
29
+ patience: 2
30
+ reduce_factor: 0.95
31
+ target_instrument: null
32
+ num_epochs: 1000
33
+ num_steps: 1000
34
+ augmentation: 1
35
+ augmentation_type: simple1
36
+ augmentation_mix: true
37
+ q: 0.95
38
+ coarse_loss_clip: true
39
+ ema_momentum: 0.999
40
+ inference:
41
+ batch_size: 1
42
+ dim_t: 256
43
+ num_overlap: 8
MDX_Net_Models/model_data/mdx_c_configs/sndfx.yaml ADDED
@@ -0,0 +1,41 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ audio:
2
+ chunk_size: 261120
3
+ dim_f: 1024
4
+ dim_t: 256
5
+ hop_length: 1024
6
+ min_mean_abs: 0.01
7
+ n_fft: 2048
8
+ num_channels: 2
9
+ sample_rate: 44100
10
+ stereo_prob: 0.7
11
+ model:
12
+ act: gelu
13
+ bottleneck_factor: 4
14
+ growth: 64
15
+ norm: InstanceNorm
16
+ num_blocks_per_scale: 2
17
+ num_channels: 64
18
+ num_scales: 5
19
+ num_subbands: 4
20
+ scale:
21
+ - 2
22
+ - 2
23
+ training:
24
+ batch_size: 8
25
+ ema_momentum: 0.999
26
+ grad_clip: null
27
+ instruments:
28
+ - Music
29
+ - Speech
30
+ - SFX
31
+ lr: 0.0001
32
+ num_steps: 30000
33
+ target_instrument: null
34
+ inference:
35
+ batch_size: 8
36
+ dim_t: 256
37
+ instruments:
38
+ - Music
39
+ - Dialog
40
+ - Effect
41
+ num_overlap: 8
MDX_Net_Models/model_data/model_data.json ADDED
@@ -0,0 +1,351 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "0ddfc0eb5792638ad5dc27850236c246": {
3
+ "compensate": 1.035,
4
+ "mdx_dim_f_set": 2048,
5
+ "mdx_dim_t_set": 8,
6
+ "mdx_n_fft_scale_set": 6144,
7
+ "primary_stem": "Vocals"
8
+ },
9
+ "26d308f91f3423a67dc69a6d12a8793d": {
10
+ "compensate": 1.035,
11
+ "mdx_dim_f_set": 2048,
12
+ "mdx_dim_t_set": 9,
13
+ "mdx_n_fft_scale_set": 8192,
14
+ "primary_stem": "Other"
15
+ },
16
+ "2cdd429caac38f0194b133884160f2c6": {
17
+ "compensate": 1.045,
18
+ "mdx_dim_f_set": 3072,
19
+ "mdx_dim_t_set": 8,
20
+ "mdx_n_fft_scale_set": 7680,
21
+ "primary_stem": "Instrumental"
22
+ },
23
+ "2f5501189a2f6db6349916fabe8c90de": {
24
+ "compensate": 1.035,
25
+ "mdx_dim_f_set": 2048,
26
+ "mdx_dim_t_set": 8,
27
+ "mdx_n_fft_scale_set": 6144,
28
+ "primary_stem": "Vocals",
29
+ "is_karaoke": true
30
+ },
31
+ "398580b6d5d973af3120df54cee6759d": {
32
+ "compensate": 1.75,
33
+ "mdx_dim_f_set": 3072,
34
+ "mdx_dim_t_set": 8,
35
+ "mdx_n_fft_scale_set": 7680,
36
+ "primary_stem": "Vocals"
37
+ },
38
+ "488b3e6f8bd3717d9d7c428476be2d75": {
39
+ "compensate": 1.035,
40
+ "mdx_dim_f_set": 3072,
41
+ "mdx_dim_t_set": 8,
42
+ "mdx_n_fft_scale_set": 7680,
43
+ "primary_stem": "Instrumental"
44
+ },
45
+ "4910e7827f335048bdac11fa967772f9": {
46
+ "compensate": 1.035,
47
+ "mdx_dim_f_set": 2048,
48
+ "mdx_dim_t_set": 7,
49
+ "mdx_n_fft_scale_set": 4096,
50
+ "primary_stem": "Drums"
51
+ },
52
+ "53c4baf4d12c3e6c3831bb8f5b532b93": {
53
+ "compensate": 1.043,
54
+ "mdx_dim_f_set": 3072,
55
+ "mdx_dim_t_set": 8,
56
+ "mdx_n_fft_scale_set": 7680,
57
+ "primary_stem": "Vocals"
58
+ },
59
+ "5d343409ef0df48c7d78cce9f0106781": {
60
+ "compensate": 1.075,
61
+ "mdx_dim_f_set": 3072,
62
+ "mdx_dim_t_set": 8,
63
+ "mdx_n_fft_scale_set": 7680,
64
+ "primary_stem": "Vocals"
65
+ },
66
+ "5f6483271e1efb9bfb59e4a3e6d4d098": {
67
+ "compensate": 1.035,
68
+ "mdx_dim_f_set": 2048,
69
+ "mdx_dim_t_set": 9,
70
+ "mdx_n_fft_scale_set": 6144,
71
+ "primary_stem": "Vocals"
72
+ },
73
+ "65ab5919372a128e4167f5e01a8fda85": {
74
+ "compensate": 1.035,
75
+ "mdx_dim_f_set": 2048,
76
+ "mdx_dim_t_set": 8,
77
+ "mdx_n_fft_scale_set": 8192,
78
+ "primary_stem": "Other"
79
+ },
80
+ "6703e39f36f18aa7855ee1047765621d": {
81
+ "compensate": 1.035,
82
+ "mdx_dim_f_set": 2048,
83
+ "mdx_dim_t_set": 9,
84
+ "mdx_n_fft_scale_set": 16384,
85
+ "primary_stem": "Bass"
86
+ },
87
+ "6b31de20e84392859a3d09d43f089515": {
88
+ "compensate": 1.035,
89
+ "mdx_dim_f_set": 2048,
90
+ "mdx_dim_t_set": 8,
91
+ "mdx_n_fft_scale_set": 6144,
92
+ "primary_stem": "Vocals"
93
+ },
94
+ "867595e9de46f6ab699008295df62798": {
95
+ "compensate": 1.03,
96
+ "mdx_dim_f_set": 3072,
97
+ "mdx_dim_t_set": 8,
98
+ "mdx_n_fft_scale_set": 7680,
99
+ "primary_stem": "Vocals"
100
+ },
101
+ "a3cd63058945e777505c01d2507daf37": {
102
+ "compensate": 1.03,
103
+ "mdx_dim_f_set": 2048,
104
+ "mdx_dim_t_set": 8,
105
+ "mdx_n_fft_scale_set": 6144,
106
+ "primary_stem": "Vocals"
107
+ },
108
+ "b33d9b3950b6cbf5fe90a32608924700": {
109
+ "compensate": 1.03,
110
+ "mdx_dim_f_set": 3072,
111
+ "mdx_dim_t_set": 8,
112
+ "mdx_n_fft_scale_set": 7680,
113
+ "primary_stem": "Vocals"
114
+ },
115
+ "c3b29bdce8c4fa17ec609e16220330ab": {
116
+ "compensate": 1.035,
117
+ "mdx_dim_f_set": 2048,
118
+ "mdx_dim_t_set": 8,
119
+ "mdx_n_fft_scale_set": 16384,
120
+ "primary_stem": "Bass"
121
+ },
122
+ "ceed671467c1f64ebdfac8a2490d0d52": {
123
+ "compensate": 1.035,
124
+ "mdx_dim_f_set": 3072,
125
+ "mdx_dim_t_set": 8,
126
+ "mdx_n_fft_scale_set": 7680,
127
+ "primary_stem": "Instrumental"
128
+ },
129
+ "d2a1376f310e4f7fa37fb9b5774eb701": {
130
+ "compensate": 1.035,
131
+ "mdx_dim_f_set": 3072,
132
+ "mdx_dim_t_set": 8,
133
+ "mdx_n_fft_scale_set": 7680,
134
+ "primary_stem": "Instrumental"
135
+ },
136
+ "d7bff498db9324db933d913388cba6be": {
137
+ "compensate": 1.035,
138
+ "mdx_dim_f_set": 2048,
139
+ "mdx_dim_t_set": 8,
140
+ "mdx_n_fft_scale_set": 6144,
141
+ "primary_stem": "Vocals"
142
+ },
143
+ "d94058f8c7f1fae4164868ae8ae66b20": {
144
+ "compensate": 1.035,
145
+ "mdx_dim_f_set": 2048,
146
+ "mdx_dim_t_set": 8,
147
+ "mdx_n_fft_scale_set": 6144,
148
+ "primary_stem": "Vocals"
149
+ },
150
+ "dc41ede5961d50f277eb846db17f5319": {
151
+ "compensate": 1.035,
152
+ "mdx_dim_f_set": 2048,
153
+ "mdx_dim_t_set": 9,
154
+ "mdx_n_fft_scale_set": 4096,
155
+ "primary_stem": "Drums"
156
+ },
157
+ "e5572e58abf111f80d8241d2e44e7fa4": {
158
+ "compensate": 1.028,
159
+ "mdx_dim_f_set": 3072,
160
+ "mdx_dim_t_set": 8,
161
+ "mdx_n_fft_scale_set": 7680,
162
+ "primary_stem": "Instrumental"
163
+ },
164
+ "e7324c873b1f615c35c1967f912db92a": {
165
+ "compensate": 1.03,
166
+ "mdx_dim_f_set": 3072,
167
+ "mdx_dim_t_set": 8,
168
+ "mdx_n_fft_scale_set": 7680,
169
+ "primary_stem": "Vocals"
170
+ },
171
+ "1c56ec0224f1d559c42fd6fd2a67b154": {
172
+ "compensate": 1.025,
173
+ "mdx_dim_f_set": 2048,
174
+ "mdx_dim_t_set": 8,
175
+ "mdx_n_fft_scale_set": 5120,
176
+ "primary_stem": "Instrumental"
177
+ },
178
+ "f2df6d6863d8f435436d8b561594ff49": {
179
+ "compensate": 1.035,
180
+ "mdx_dim_f_set": 3072,
181
+ "mdx_dim_t_set": 8,
182
+ "mdx_n_fft_scale_set": 7680,
183
+ "primary_stem": "Instrumental"
184
+ },
185
+ "b06327a00d5e5fbc7d96e1781bbdb596": {
186
+ "compensate": 1.035,
187
+ "mdx_dim_f_set": 3072,
188
+ "mdx_dim_t_set": 8,
189
+ "mdx_n_fft_scale_set": 6144,
190
+ "primary_stem": "Instrumental"
191
+ },
192
+ "94ff780b977d3ca07c7a343dab2e25dd": {
193
+ "compensate": 1.039,
194
+ "mdx_dim_f_set": 3072,
195
+ "mdx_dim_t_set": 8,
196
+ "mdx_n_fft_scale_set": 6144,
197
+ "primary_stem": "Instrumental"
198
+ },
199
+ "73492b58195c3b52d34590d5474452f6": {
200
+ "compensate": 1.043,
201
+ "mdx_dim_f_set": 3072,
202
+ "mdx_dim_t_set": 8,
203
+ "mdx_n_fft_scale_set": 7680,
204
+ "primary_stem": "Vocals"
205
+ },
206
+ "970b3f9492014d18fefeedfe4773cb42": {
207
+ "compensate": 1.009,
208
+ "mdx_dim_f_set": 3072,
209
+ "mdx_dim_t_set": 8,
210
+ "mdx_n_fft_scale_set": 7680,
211
+ "primary_stem": "Vocals"
212
+ },
213
+ "1d64a6d2c30f709b8c9b4ce1366d96ee": {
214
+ "compensate": 1.065,
215
+ "mdx_dim_f_set": 2048,
216
+ "mdx_dim_t_set": 8,
217
+ "mdx_n_fft_scale_set": 5120,
218
+ "primary_stem": "Instrumental",
219
+ "is_karaoke": true
220
+ },
221
+ "203f2a3955221b64df85a41af87cf8f0": {
222
+ "compensate": 1.035,
223
+ "mdx_dim_f_set": 3072,
224
+ "mdx_dim_t_set": 8,
225
+ "mdx_n_fft_scale_set": 6144,
226
+ "primary_stem": "Instrumental"
227
+ },
228
+ "291c2049608edb52648b96e27eb80e95": {
229
+ "compensate": 1.035,
230
+ "mdx_dim_f_set": 3072,
231
+ "mdx_dim_t_set": 8,
232
+ "mdx_n_fft_scale_set": 6144,
233
+ "primary_stem": "Instrumental"
234
+ },
235
+ "ead8d05dab12ec571d67549b3aab03fc": {
236
+ "compensate": 1.035,
237
+ "mdx_dim_f_set": 3072,
238
+ "mdx_dim_t_set": 8,
239
+ "mdx_n_fft_scale_set": 6144,
240
+ "primary_stem": "Instrumental"
241
+ },
242
+ "cc63408db3d80b4d85b0287d1d7c9632": {
243
+ "compensate": 1.033,
244
+ "mdx_dim_f_set": 3072,
245
+ "mdx_dim_t_set": 8,
246
+ "mdx_n_fft_scale_set": 6144,
247
+ "primary_stem": "Instrumental"
248
+ },
249
+ "cd5b2989ad863f116c855db1dfe24e39": {
250
+ "compensate": 1.035,
251
+ "mdx_dim_f_set": 3072,
252
+ "mdx_dim_t_set": 9,
253
+ "mdx_n_fft_scale_set": 6144,
254
+ "primary_stem": "Reverb"
255
+ },
256
+ "55657dd70583b0fedfba5f67df11d711": {
257
+ "compensate": 1.022,
258
+ "mdx_dim_f_set": 3072,
259
+ "mdx_dim_t_set": 8,
260
+ "mdx_n_fft_scale_set": 6144,
261
+ "primary_stem": "Instrumental"
262
+ },
263
+ "b6bccda408a436db8500083ef3491e8b": {
264
+ "compensate": 1.02,
265
+ "mdx_dim_f_set": 3072,
266
+ "mdx_dim_t_set": 8,
267
+ "mdx_n_fft_scale_set": 7680,
268
+ "primary_stem": "Instrumental"
269
+ },
270
+ "8a88db95c7fb5dbe6a095ff2ffb428b1": {
271
+ "compensate": 1.026,
272
+ "mdx_dim_f_set": 2048,
273
+ "mdx_dim_t_set": 8,
274
+ "mdx_n_fft_scale_set": 5120,
275
+ "primary_stem": "Instrumental"
276
+ },
277
+ "b78da4afc6512f98e4756f5977f5c6b9": {
278
+ "compensate": 1.021,
279
+ "mdx_dim_f_set": 3072,
280
+ "mdx_dim_t_set": 8,
281
+ "mdx_n_fft_scale_set": 7680,
282
+ "primary_stem": "Instrumental"
283
+ },
284
+ "77d07b2667ddf05b9e3175941b4454a0": {
285
+ "compensate": 1.021,
286
+ "mdx_dim_f_set": 3072,
287
+ "mdx_dim_t_set": 8,
288
+ "mdx_n_fft_scale_set": 7680,
289
+ "primary_stem": "Vocals"
290
+ },
291
+ "2154254ee89b2945b97a7efed6e88820": {
292
+ "config_yaml": "model_2_stem_061321.yaml"
293
+ },
294
+ "063aadd735d58150722926dcbf5852a9": {
295
+ "config_yaml": "model_2_stem_061321.yaml"
296
+ },
297
+ "c09f714d978b41d718facfe3427e6001": {
298
+ "config_yaml": "model_2_stem_061321.yaml"
299
+ },
300
+ "fe96801369f6a148df2720f5ced88c19": {
301
+ "config_yaml": "model3.yaml"
302
+ },
303
+ "02e8b226f85fb566e5db894b9931c640": {
304
+ "config_yaml": "model2.yaml"
305
+ },
306
+ "e3de6d861635ab9c1d766149edd680d6": {
307
+ "config_yaml": "model1.yaml"
308
+ },
309
+ "3f2936c554ab73ce2e396d54636bd373": {
310
+ "config_yaml": "modelB.yaml"
311
+ },
312
+ "890d0f6f82d7574bca741a9e8bcb8168": {
313
+ "config_yaml": "modelB.yaml"
314
+ },
315
+ "63a3cb8c37c474681049be4ad1ba8815": {
316
+ "config_yaml": "modelB.yaml"
317
+ },
318
+ "a7fc5d719743c7fd6b61bd2b4d48b9f0": {
319
+ "config_yaml": "modelA.yaml"
320
+ },
321
+ "3567f3dee6e77bf366fcb1c7b8bc3745": {
322
+ "config_yaml": "modelA.yaml"
323
+ },
324
+ "a28f4d717bd0d34cd2ff7a3b0a3d065e": {
325
+ "config_yaml": "modelA.yaml"
326
+ },
327
+ "c9971a18da20911822593dc81caa8be9": {
328
+ "config_yaml": "sndfx.yaml"
329
+ },
330
+ "57d94d5ed705460d21c75a5ac829a605": {
331
+ "config_yaml": "sndfx.yaml"
332
+ },
333
+ "e7a25f8764f25a52c1b96c4946e66ba2": {
334
+ "config_yaml": "sndfx.yaml"
335
+ },
336
+ "104081d24e37217086ce5fde09147ee1": {
337
+ "config_yaml": "model_2_stem_061321.yaml"
338
+ },
339
+ "1e6165b601539f38d0a9330f3facffeb": {
340
+ "config_yaml": "model_2_stem_061321.yaml"
341
+ },
342
+ "fe0108464ce0d8271be5ab810891bd7c": {
343
+ "config_yaml": "model_2_stem_full_band.yaml"
344
+ },
345
+ "e9b82ec90ee56c507a3a982f1555714c": {
346
+ "config_yaml": "model_2_stem_full_band_2.yaml"
347
+ },
348
+ "99b6ceaae542265a3b6d657bf9fde79f": {
349
+ "config_yaml": "model_2_stem_full_band_8k.yaml"
350
+ }
351
+ }
MDX_Net_Models/model_data/model_name_mapper.json ADDED
@@ -0,0 +1,22 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "UVR_MDXNET_1_9703": "UVR-MDX-NET 1",
3
+ "UVR_MDXNET_2_9682": "UVR-MDX-NET 2",
4
+ "UVR_MDXNET_3_9662": "UVR-MDX-NET 3",
5
+ "UVR_MDXNET_KARA": "UVR-MDX-NET Karaoke",
6
+ "UVR_MDXNET_Main": "UVR-MDX-NET Main",
7
+ "UVR-MDX-NET-Inst_1": "UVR-MDX-NET Inst 1",
8
+ "UVR-MDX-NET-Inst_2": "UVR-MDX-NET Inst 2",
9
+ "UVR-MDX-NET-Inst_3": "UVR-MDX-NET Inst 3",
10
+ "UVR-MDX-NET-Inst_4": "UVR-MDX-NET Inst 4",
11
+ "UVR-MDX-NET-Inst_Main": "UVR-MDX-NET Inst Main",
12
+ "UVR-MDX-NET-Inst_Main_2": "UVR-MDX-NET Inst Main 2",
13
+ "UVR-MDX-NET-Inst_HQ_1": "UVR-MDX-NET Inst HQ 1",
14
+ "UVR-MDX-NET-Inst_HQ_2": "UVR-MDX-NET Inst HQ 2",
15
+ "UVR-MDX-NET-Inst_HQ_3": "UVR-MDX-NET Inst HQ 3",
16
+ "UVR_MDXNET_KARA_2": "UVR-MDX-NET Karaoke 2",
17
+ "Kim_Vocal_1": "Kim Vocal 1",
18
+ "Kim_Vocal_2": "Kim Vocal 2",
19
+ "Kim_Inst": "Kim Inst",
20
+ "MDX23C-8KFFT-InstVoc_HQ.ckpt": "MDX23C-InstVoc HQ",
21
+ "Reverb_HQ_By_FoxJoy": "Reverb HQ"
22
+ }