diff --git a/models/MDX_Net_Models/desktop.ini b/models/MDX_Net_Models/desktop.ini new file mode 100644 index 0000000..a5431d2 --- /dev/null +++ b/models/MDX_Net_Models/desktop.ini @@ -0,0 +1,9 @@ +[LocalizedFileNames] +UVR-MDX-NET_Main_439.onnx=@UVR-MDX-NET_Main_439.onnx,0 +UVR-MDX-NET_Main_438.onnx=@UVR-MDX-NET_Main_438.onnx,0 +UVR-MDX-NET_Main_437.onnx=@UVR-MDX-NET_Main_437.onnx,0 +UVR-MDX-NET_Main_436.onnx=@UVR-MDX-NET_Main_436.onnx,0 +UVR-MDX-NET_Main_435.onnx=@UVR-MDX-NET_Main_435.onnx,0 +UVR-MDX-NET_Main_434.onnx=@UVR-MDX-NET_Main_434.onnx,0 +bass.onnx=@bass.onnx,0 +drums.onnx=@drums.onnx,0 diff --git a/models/MDX_Net_Models/model_data/mdx_c_configs/model1.yaml b/models/MDX_Net_Models/model_data/mdx_c_configs/model1.yaml new file mode 100644 index 0000000..4a0af14 --- /dev/null +++ b/models/MDX_Net_Models/model_data/mdx_c_configs/model1.yaml @@ -0,0 +1,34 @@ +audio: + chunk_size: 260096 + dim_f: 4096 + dim_t: 128 + hop_length: 2048 + n_fft: 8192 + num_channels: 2 + sample_rate: 44100 +model: + act: gelu + bottleneck_factor: 4 + growth: 64 + norm: InstanceNorm + num_blocks_per_scale: 2 + num_channels: 128 + num_scales: 5 + num_subbands: 4 + scale: + - 2 + - 2 +training: + batch_size: 8 + grad_clip: 0 + instruments: + - Vocals + - Drums + - Bass + - Other + lr: 5.0e-05 + target_instrument: null +inference: + batch_size: 1 + dim_t: 256 + num_overlap: 8 \ No newline at end of file diff --git a/models/MDX_Net_Models/model_data/mdx_c_configs/model2.yaml b/models/MDX_Net_Models/model_data/mdx_c_configs/model2.yaml new file mode 100644 index 0000000..304777a --- /dev/null +++ b/models/MDX_Net_Models/model_data/mdx_c_configs/model2.yaml @@ -0,0 +1,34 @@ +audio: + chunk_size: 260096 + dim_f: 4096 + dim_t: 128 + hop_length: 2048 + n_fft: 8192 + num_channels: 2 + sample_rate: 44100 +model: + act: gelu + bottleneck_factor: 4 + growth: 64 + norm: InstanceNorm + num_blocks_per_scale: 2 + num_channels: 256 + num_scales: 5 + num_subbands: 4 + scale: + - 2 + - 2 +training: + batch_size: 8 + grad_clip: 0 + instruments: + - Vocals + - Drums + - Bass + - Other + lr: 3.0e-05 + target_instrument: null +inference: + batch_size: 1 + dim_t: 256 + num_overlap: 8 \ No newline at end of file diff --git a/models/MDX_Net_Models/model_data/mdx_c_configs/model3.yaml b/models/MDX_Net_Models/model_data/mdx_c_configs/model3.yaml new file mode 100644 index 0000000..491f6d3 --- /dev/null +++ b/models/MDX_Net_Models/model_data/mdx_c_configs/model3.yaml @@ -0,0 +1,34 @@ +audio: + chunk_size: 260096 + dim_f: 4096 + dim_t: 128 + hop_length: 2048 + n_fft: 12288 + num_channels: 2 + sample_rate: 44100 +model: + act: gelu + bottleneck_factor: 4 + growth: 64 + norm: InstanceNorm + num_blocks_per_scale: 2 + num_channels: 128 + num_scales: 5 + num_subbands: 4 + scale: + - 2 + - 2 +training: + batch_size: 8 + grad_clip: 0 + instruments: + - Vocals + - Drums + - Bass + - Other + lr: 5.0e-05 + target_instrument: Vocals +inference: + batch_size: 1 + dim_t: 256 + num_overlap: 8 \ No newline at end of file diff --git a/models/MDX_Net_Models/model_data/mdx_c_configs/modelA.yaml b/models/MDX_Net_Models/model_data/mdx_c_configs/modelA.yaml new file mode 100644 index 0000000..a687be7 --- /dev/null +++ b/models/MDX_Net_Models/model_data/mdx_c_configs/modelA.yaml @@ -0,0 +1,39 @@ +audio: + chunk_size: 261120 + dim_f: 4096 + dim_t: 256 + hop_length: 1024 + min_mean_abs: 0.01 + n_fft: 8192 + num_channels: 2 + sample_rate: 44100 +model: + act: gelu + bottleneck_factor: 4 + growth: 64 + norm: InstanceNorm + num_blocks_per_scale: 2 + num_channels: 64 + num_scales: 5 + num_subbands: 4 + scale: + - 2 + - 2 +training: + batch_size: 6 + coarse_loss_clip: true + ema_momentum: 0.999 + grad_clip: null + instruments: + - Vocals + - Drums + - Bass + - Other + lr: 0.0001 + num_steps: 100000 + q: 0.4 + target_instrument: null +inference: + batch_size: 2 + dim_t: 256 + num_overlap: 8 diff --git a/models/MDX_Net_Models/model_data/mdx_c_configs/modelB.yaml b/models/MDX_Net_Models/model_data/mdx_c_configs/modelB.yaml new file mode 100644 index 0000000..a20f26e --- /dev/null +++ b/models/MDX_Net_Models/model_data/mdx_c_configs/modelB.yaml @@ -0,0 +1,41 @@ +audio: + chunk_size: 261120 + dim_f: 4096 + dim_t: 256 + hop_length: 1024 + min_mean_abs: 0.01 + n_fft: 8192 + num_channels: 2 + sample_rate: 44100 +model: + act: gelu + bottleneck_factor: 4 + growth: 64 + norm: InstanceNorm + num_blocks_per_scale: 2 + num_channels: 64 + num_scales: 5 + num_subbands: 4 + scale: + - 2 + - 2 +training: + batch_size: 6 + coarse_loss_clip: false + datasets: + - ../data/moises/bleeding + ema_momentum: 0.999 + grad_clip: null + instruments: + - Vocals + - Drums + - Bass + - Other + lr: 0.0001 + num_steps: 150000 + q: 0.93 + target_instrument: null +inference: + batch_size: 2 + dim_t: 256 + num_overlap: 8 \ No newline at end of file diff --git a/models/MDX_Net_Models/model_data/mdx_c_configs/model_2_stem_061321.yaml b/models/MDX_Net_Models/model_data/mdx_c_configs/model_2_stem_061321.yaml new file mode 100644 index 0000000..d5412e0 --- /dev/null +++ b/models/MDX_Net_Models/model_data/mdx_c_configs/model_2_stem_061321.yaml @@ -0,0 +1,36 @@ +audio: + chunk_size: 260096 + dim_f: 4096 + dim_t: 256 + hop_length: 2048 + n_fft: 12288 + num_channels: 2 + sample_rate: 44100 + min_mean_abs: 0.001 +model: + act: gelu + bottleneck_factor: 4 + growth: 64 + norm: InstanceNorm + num_blocks_per_scale: 2 + num_channels: 128 + num_scales: 5 + num_subbands: 4 + scale: + - 2 + - 2 + name: epoch_10.ckpt +training: + batch_size: 16 + grad_clip: 0 + instruments: + - Vocals + - Instrumental + lr: 5.0e-05 + target_instrument: null + num_epochs: 100 + num_steps: 1000 +inference: + batch_size: 1 + dim_t: 256 + num_overlap: 8 diff --git a/models/MDX_Net_Models/model_data/mdx_c_configs/model_2_stem_full_band.yaml b/models/MDX_Net_Models/model_data/mdx_c_configs/model_2_stem_full_band.yaml new file mode 100644 index 0000000..af253ed --- /dev/null +++ b/models/MDX_Net_Models/model_data/mdx_c_configs/model_2_stem_full_band.yaml @@ -0,0 +1,36 @@ +audio: + chunk_size: 260096 + dim_f: 6144 + dim_t: 128 + hop_length: 2048 + n_fft: 12288 + num_channels: 2 + sample_rate: 44100 + min_mean_abs: 0.001 +model: + act: gelu + bottleneck_factor: 4 + growth: 64 + norm: InstanceNorm + num_blocks_per_scale: 2 + num_channels: 128 + num_scales: 5 + num_subbands: 6 + scale: + - 2 + - 2 +training: + batch_size: 14 + grad_clip: 0 + instruments: + - Vocals + - Instrumental + lr: 3.0e-05 + target_instrument: null + num_epochs: 1000 + num_steps: 1000 + augmentation: 1 +inference: + batch_size: 1 + dim_t: 256 + num_overlap: 8 \ No newline at end of file diff --git a/models/MDX_Net_Models/model_data/mdx_c_configs/model_2_stem_full_band_2.yaml b/models/MDX_Net_Models/model_data/mdx_c_configs/model_2_stem_full_band_2.yaml new file mode 100644 index 0000000..8d8dfb7 --- /dev/null +++ b/models/MDX_Net_Models/model_data/mdx_c_configs/model_2_stem_full_band_2.yaml @@ -0,0 +1,36 @@ +audio: + chunk_size: 260096 + dim_f: 6144 + dim_t: 128 + hop_length: 2048 + n_fft: 12288 + num_channels: 2 + sample_rate: 44100 + min_mean_abs: 0.001 +model: + act: gelu + bottleneck_factor: 4 + growth: 128 + norm: InstanceNorm + num_blocks_per_scale: 2 + num_channels: 128 + num_scales: 5 + num_subbands: 6 + scale: + - 2 + - 2 +training: + batch_size: 14 + grad_clip: 0 + instruments: + - Vocals + - Instrumental + lr: 2.0e-05 + target_instrument: null + num_epochs: 1000 + num_steps: 1000 + augmentation: 1 +inference: + batch_size: 1 + dim_t: 256 + num_overlap: 8 \ No newline at end of file diff --git a/models/MDX_Net_Models/model_data/mdx_c_configs/model_2_stem_full_band_3.yaml b/models/MDX_Net_Models/model_data/mdx_c_configs/model_2_stem_full_band_3.yaml new file mode 100644 index 0000000..c139474 --- /dev/null +++ b/models/MDX_Net_Models/model_data/mdx_c_configs/model_2_stem_full_band_3.yaml @@ -0,0 +1,39 @@ +audio: + chunk_size: 261120 + dim_f: 6144 + dim_t: 256 + hop_length: 1024 + n_fft: 12288 + num_channels: 2 + sample_rate: 44100 + min_mean_abs: 0.001 +model: + act: gelu + bottleneck_factor: 4 + growth: 128 + norm: InstanceNorm + num_blocks_per_scale: 2 + num_channels: 128 + num_scales: 5 + num_subbands: 6 + scale: + - 2 + - 2 +training: + batch_size: 6 + grad_clip: 0 + instruments: + - Vocals + - Instrumental + lr: 1.0e-05 + target_instrument: null + num_epochs: 1000 + num_steps: 1000 + augmentation: 1 + q: 0.95 + coarse_loss_clip: true + ema_momentum: 0.999 +inference: + batch_size: 1 + dim_t: 256 + num_overlap: 8 \ No newline at end of file diff --git a/models/MDX_Net_Models/model_data/mdx_c_configs/model_2_stem_full_band_4.yaml b/models/MDX_Net_Models/model_data/mdx_c_configs/model_2_stem_full_band_4.yaml new file mode 100644 index 0000000..783d622 --- /dev/null +++ b/models/MDX_Net_Models/model_data/mdx_c_configs/model_2_stem_full_band_4.yaml @@ -0,0 +1,40 @@ +audio: + chunk_size: 261120 + dim_f: 6144 + dim_t: 256 + hop_length: 1024 + n_fft: 12288 + num_channels: 2 + sample_rate: 44100 + min_mean_abs: 0.001 +model: + act: gelu + bottleneck_factor: 4 + growth: 128 + norm: InstanceNorm + num_blocks_per_scale: 2 + num_channels: 128 + num_scales: 5 + num_subbands: 6 + scale: + - 2 + - 2 +training: + batch_size: 6 + grad_clip: 0 + instruments: + - Vocals + - Instrumental + lr: 0.7e-05 + patience: 2 + target_instrument: null + num_epochs: 1000 + num_steps: 1000 + augmentation: 1 + q: 0.95 + coarse_loss_clip: true + ema_momentum: 0.999 +inference: + batch_size: 1 + dim_t: 256 + num_overlap: 8 \ No newline at end of file diff --git a/models/MDX_Net_Models/model_data/mdx_c_configs/model_2_stem_full_band_8k.yaml b/models/MDX_Net_Models/model_data/mdx_c_configs/model_2_stem_full_band_8k.yaml new file mode 100644 index 0000000..207aa71 --- /dev/null +++ b/models/MDX_Net_Models/model_data/mdx_c_configs/model_2_stem_full_band_8k.yaml @@ -0,0 +1,43 @@ +audio: + chunk_size: 261120 + dim_f: 4096 + dim_t: 256 + hop_length: 1024 + n_fft: 8192 + num_channels: 2 + sample_rate: 44100 + min_mean_abs: 0.001 +model: + act: gelu + bottleneck_factor: 4 + growth: 128 + norm: InstanceNorm + num_blocks_per_scale: 2 + num_channels: 128 + num_scales: 5 + num_subbands: 4 + scale: + - 2 + - 2 +training: + batch_size: 6 + grad_clip: 0 + instruments: + - Vocals + - Instrumental + lr: 1.0e-05 + patience: 2 + reduce_factor: 0.95 + target_instrument: null + num_epochs: 1000 + num_steps: 1000 + augmentation: 1 + augmentation_type: simple1 + augmentation_mix: true + q: 0.95 + coarse_loss_clip: true + ema_momentum: 0.999 +inference: + batch_size: 1 + dim_t: 256 + num_overlap: 8 \ No newline at end of file diff --git a/models/MDX_Net_Models/model_data/mdx_c_configs/sndfx.yaml b/models/MDX_Net_Models/model_data/mdx_c_configs/sndfx.yaml new file mode 100644 index 0000000..75fccad --- /dev/null +++ b/models/MDX_Net_Models/model_data/mdx_c_configs/sndfx.yaml @@ -0,0 +1,41 @@ +audio: + chunk_size: 261120 + dim_f: 1024 + dim_t: 256 + hop_length: 1024 + min_mean_abs: 0.01 + n_fft: 2048 + num_channels: 2 + sample_rate: 44100 + stereo_prob: 0.7 +model: + act: gelu + bottleneck_factor: 4 + growth: 64 + norm: InstanceNorm + num_blocks_per_scale: 2 + num_channels: 64 + num_scales: 5 + num_subbands: 4 + scale: + - 2 + - 2 +training: + batch_size: 8 + ema_momentum: 0.999 + grad_clip: null + instruments: + - Music + - Speech + - SFX + lr: 0.0001 + num_steps: 30000 + target_instrument: null +inference: + batch_size: 8 + dim_t: 256 + instruments: + - Music + - Dialog + - Effect + num_overlap: 8 diff --git a/models/MDX_Net_Models/model_data/model_data.json b/models/MDX_Net_Models/model_data/model_data.json index 309fe07..dc33f4d 100644 --- a/models/MDX_Net_Models/model_data/model_data.json +++ b/models/MDX_Net_Models/model_data/model_data.json @@ -14,7 +14,7 @@ "primary_stem": "Other" }, "2cdd429caac38f0194b133884160f2c6": { - "compensate": 1.035, + "compensate": 1.045, "mdx_dim_f_set": 3072, "mdx_dim_t_set": 8, "mdx_n_fft_scale_set": 7680, @@ -25,7 +25,8 @@ "mdx_dim_f_set": 2048, "mdx_dim_t_set": 8, "mdx_n_fft_scale_set": 6144, - "primary_stem": "Vocals" + "primary_stem": "Vocals", + "is_karaoke": true }, "398580b6d5d973af3120df54cee6759d": { "compensate": 1.75, @@ -49,7 +50,7 @@ "primary_stem": "Drums" }, "53c4baf4d12c3e6c3831bb8f5b532b93": { - "compensate": 1.035, + "compensate": 1.043, "mdx_dim_f_set": 3072, "mdx_dim_t_set": 8, "mdx_n_fft_scale_set": 7680, @@ -91,21 +92,21 @@ "primary_stem": "Vocals" }, "867595e9de46f6ab699008295df62798": { - "compensate": 1.075, + "compensate": 1.03, "mdx_dim_f_set": 3072, "mdx_dim_t_set": 8, "mdx_n_fft_scale_set": 7680, "primary_stem": "Vocals" }, "a3cd63058945e777505c01d2507daf37": { - "compensate": 1.035, + "compensate": 1.03, "mdx_dim_f_set": 2048, "mdx_dim_t_set": 8, "mdx_n_fft_scale_set": 6144, "primary_stem": "Vocals" }, "b33d9b3950b6cbf5fe90a32608924700": { - "compensate": 1.075, + "compensate": 1.03, "mdx_dim_f_set": 3072, "mdx_dim_t_set": 8, "mdx_n_fft_scale_set": 7680, @@ -154,21 +155,21 @@ "primary_stem": "Drums" }, "e5572e58abf111f80d8241d2e44e7fa4": { - "compensate": 1.035, + "compensate": 1.028, "mdx_dim_f_set": 3072, "mdx_dim_t_set": 8, "mdx_n_fft_scale_set": 7680, "primary_stem": "Instrumental" }, "e7324c873b1f615c35c1967f912db92a": { - "compensate": 1.075, + "compensate": 1.03, "mdx_dim_f_set": 3072, "mdx_dim_t_set": 8, "mdx_n_fft_scale_set": 7680, "primary_stem": "Vocals" }, "1c56ec0224f1d559c42fd6fd2a67b154": { - "compensate": 1.035, + "compensate": 1.025, "mdx_dim_f_set": 2048, "mdx_dim_t_set": 8, "mdx_n_fft_scale_set": 5120, @@ -189,25 +190,33 @@ "primary_stem": "Instrumental" }, "94ff780b977d3ca07c7a343dab2e25dd": { - "compensate": 1.035, + "compensate": 1.039, "mdx_dim_f_set": 3072, "mdx_dim_t_set": 8, "mdx_n_fft_scale_set": 6144, "primary_stem": "Instrumental" }, "73492b58195c3b52d34590d5474452f6": { - "compensate": 1.075, + "compensate": 1.043, + "mdx_dim_f_set": 3072, + "mdx_dim_t_set": 8, + "mdx_n_fft_scale_set": 7680, + "primary_stem": "Vocals" + }, + "970b3f9492014d18fefeedfe4773cb42": { + "compensate": 1.009, "mdx_dim_f_set": 3072, "mdx_dim_t_set": 8, "mdx_n_fft_scale_set": 7680, "primary_stem": "Vocals" }, "1d64a6d2c30f709b8c9b4ce1366d96ee": { - "compensate": 1.035, + "compensate": 1.065, "mdx_dim_f_set": 2048, "mdx_dim_t_set": 8, "mdx_n_fft_scale_set": 5120, - "primary_stem": "Instrumental" + "primary_stem": "Instrumental", + "is_karaoke": true }, "203f2a3955221b64df85a41af87cf8f0": { "compensate": 1.035, @@ -229,5 +238,114 @@ "mdx_dim_t_set": 8, "mdx_n_fft_scale_set": 6144, "primary_stem": "Instrumental" + }, + "cc63408db3d80b4d85b0287d1d7c9632": { + "compensate": 1.033, + "mdx_dim_f_set": 3072, + "mdx_dim_t_set": 8, + "mdx_n_fft_scale_set": 6144, + "primary_stem": "Instrumental" + }, + "cd5b2989ad863f116c855db1dfe24e39": { + "compensate": 1.035, + "mdx_dim_f_set": 3072, + "mdx_dim_t_set": 9, + "mdx_n_fft_scale_set": 6144, + "primary_stem": "Reverb" + }, + "55657dd70583b0fedfba5f67df11d711": { + "compensate": 1.022, + "mdx_dim_f_set": 3072, + "mdx_dim_t_set": 8, + "mdx_n_fft_scale_set": 6144, + "primary_stem": "Instrumental" + }, + "b6bccda408a436db8500083ef3491e8b": { + "compensate": 1.02, + "mdx_dim_f_set": 3072, + "mdx_dim_t_set": 8, + "mdx_n_fft_scale_set": 7680, + "primary_stem": "Instrumental" + }, + "8a88db95c7fb5dbe6a095ff2ffb428b1": { + "compensate": 1.026, + "mdx_dim_f_set": 2048, + "mdx_dim_t_set": 8, + "mdx_n_fft_scale_set": 5120, + "primary_stem": "Instrumental" + }, + "b78da4afc6512f98e4756f5977f5c6b9": { + "compensate": 1.021, + "mdx_dim_f_set": 3072, + "mdx_dim_t_set": 8, + "mdx_n_fft_scale_set": 7680, + "primary_stem": "Instrumental" + }, + "77d07b2667ddf05b9e3175941b4454a0": { + "compensate": 1.021, + "mdx_dim_f_set": 3072, + "mdx_dim_t_set": 8, + "mdx_n_fft_scale_set": 7680, + "primary_stem": "Vocals" + }, + "2154254ee89b2945b97a7efed6e88820": { + "config_yaml": "model_2_stem_061321.yaml" + }, + "063aadd735d58150722926dcbf5852a9": { + "config_yaml": "model_2_stem_061321.yaml" + }, + "c09f714d978b41d718facfe3427e6001": { + "config_yaml": "model_2_stem_061321.yaml" + }, + "fe96801369f6a148df2720f5ced88c19": { + "config_yaml": "model3.yaml" + }, + "02e8b226f85fb566e5db894b9931c640": { + "config_yaml": "model2.yaml" + }, + "e3de6d861635ab9c1d766149edd680d6": { + "config_yaml": "model1.yaml" + }, + "3f2936c554ab73ce2e396d54636bd373": { + "config_yaml": "modelB.yaml" + }, + "890d0f6f82d7574bca741a9e8bcb8168": { + "config_yaml": "modelB.yaml" + }, + "63a3cb8c37c474681049be4ad1ba8815": { + "config_yaml": "modelB.yaml" + }, + "a7fc5d719743c7fd6b61bd2b4d48b9f0": { + "config_yaml": "modelA.yaml" + }, + "3567f3dee6e77bf366fcb1c7b8bc3745": { + "config_yaml": "modelA.yaml" + }, + "a28f4d717bd0d34cd2ff7a3b0a3d065e": { + "config_yaml": "modelA.yaml" + }, + "c9971a18da20911822593dc81caa8be9": { + "config_yaml": "sndfx.yaml" + }, + "57d94d5ed705460d21c75a5ac829a605": { + "config_yaml": "sndfx.yaml" + }, + "e7a25f8764f25a52c1b96c4946e66ba2": { + "config_yaml": "sndfx.yaml" + }, + "104081d24e37217086ce5fde09147ee1": { + "config_yaml": "model_2_stem_061321.yaml" + }, + "1e6165b601539f38d0a9330f3facffeb": { + "config_yaml": "model_2_stem_061321.yaml" + }, + "fe0108464ce0d8271be5ab810891bd7c": { + "config_yaml": "model_2_stem_full_band.yaml" + }, + "e9b82ec90ee56c507a3a982f1555714c": { + "config_yaml": "model_2_stem_full_band_2.yaml" + }, + "99b6ceaae542265a3b6d657bf9fde79f": { + "config_yaml": "model_2_stem_full_band_8k.yaml" } } \ No newline at end of file diff --git a/models/MDX_Net_Models/model_data/model_name_mapper.json b/models/MDX_Net_Models/model_data/model_name_mapper.json index 0f18f6d..1476ad0 100644 --- a/models/MDX_Net_Models/model_data/model_name_mapper.json +++ b/models/MDX_Net_Models/model_data/model_name_mapper.json @@ -7,7 +7,16 @@ "UVR-MDX-NET-Inst_1": "UVR-MDX-NET Inst 1", "UVR-MDX-NET-Inst_2": "UVR-MDX-NET Inst 2", "UVR-MDX-NET-Inst_3": "UVR-MDX-NET Inst 3", + "UVR-MDX-NET-Inst_4": "UVR-MDX-NET Inst 4", "UVR-MDX-NET-Inst_Main": "UVR-MDX-NET Inst Main", + "UVR-MDX-NET-Inst_Main_2": "UVR-MDX-NET Inst Main 2", "UVR-MDX-NET-Inst_HQ_1": "UVR-MDX-NET Inst HQ 1", - "UVR_MDXNET_KARA_2": "UVR-MDX-NET Karaoke 2" + "UVR-MDX-NET-Inst_HQ_2": "UVR-MDX-NET Inst HQ 2", + "UVR-MDX-NET-Inst_HQ_3": "UVR-MDX-NET Inst HQ 3", + "UVR_MDXNET_KARA_2": "UVR-MDX-NET Karaoke 2", + "Kim_Vocal_1": "Kim Vocal 1", + "Kim_Vocal_2": "Kim Vocal 2", + "Kim_Inst": "Kim Inst", + "MDX23C-8KFFT-InstVoc_HQ.ckpt": "MDX23C-InstVoc HQ", + "Reverb_HQ_By_FoxJoy": "Reverb HQ" } \ No newline at end of file diff --git a/models/VR_Models/UVR-DeNoise-Lite.pth b/models/VR_Models/UVR-DeNoise-Lite.pth new file mode 100644 index 0000000..195c193 Binary files /dev/null and b/models/VR_Models/UVR-DeNoise-Lite.pth differ diff --git a/models/VR_Models/model_data/model_data.json b/models/VR_Models/model_data/model_data.json index b1abb2c..2ff77d0 100644 --- a/models/VR_Models/model_data/model_data.json +++ b/models/VR_Models/model_data/model_data.json @@ -13,7 +13,7 @@ }, "2aa34fbc01f8e6d2bf509726481e7142": { "vr_model_param": "4band_44100", - "primary_stem": "Other" + "primary_stem": "No Piano" }, "3e18f639b11abea7361db1a4a91c2559": { "vr_model_param": "4band_44100", @@ -29,7 +29,8 @@ }, "6b5916069a49be3fe29d4397ecfd73fa": { "vr_model_param": "3band_44100_msb2", - "primary_stem": "Instrumental" + "primary_stem": "Instrumental", + "is_karaoke": true }, "74b3bc5fa2b69f29baf7839b858bc679": { "vr_model_param": "4band_44100", @@ -85,10 +86,52 @@ }, "f6ea8473ff86017b5ebd586ccacf156b": { "vr_model_param": "4band_v2_sn", - "primary_stem": "Instrumental" + "primary_stem": "Instrumental", + "is_karaoke": true }, "fd297a61eafc9d829033f8b987c39a3d": { "vr_model_param": "1band_sr32000_hl512", "primary_stem": "Instrumental" + }, + "0ec76fd9e65f81d8b4fbd13af4826ed8": { + "vr_model_param": "4band_v3", + "primary_stem": "No Woodwinds" + }, + "0fb9249ffe4ffc38d7b16243f394c0ff": { + "vr_model_param": "4band_v3", + "primary_stem": "No Reverb" + }, + "6857b2972e1754913aad0c9a1678c753": { + "vr_model_param": "4band_v3", + "primary_stem": "Echo", + "nout": 48, + "nout_lstm": 128 + }, + "f200a145434efc7dcf0cd093f517ed52": { + "vr_model_param": "4band_v3", + "primary_stem": "No Echo", + "nout": 48, + "nout_lstm": 128 + }, + "44c55d8b5d2e3edea98c2b2bf93071c7": { + "vr_model_param": "4band_v3", + "primary_stem": "Noise", + "nout": 48, + "nout_lstm": 128 + }, + "51ea8c43a6928ed3c10ef5cb2707d57b": { + "vr_model_param": "1band_sr44100_hl1024", + "primary_stem": "Noise", + "nout": 16, + "nout_lstm": 128 + }, + "944950a9c5963a5eb70b445d67b7068a": { + "vr_model_param": "4band_v3_sn", + "primary_stem": "Vocals", + "nout": 64, + "nout_lstm": 128, + "is_karaoke": false, + "is_bv_model": true, + "is_bv_model_rebalanced": 0.9 } } \ No newline at end of file