Ultimate-Vocal-Remover-WebUI

Sleeping

App Files Community

next-playground committed on Jun 27, 2024

Commit

5528da5

verified ·

1 Parent(s): c890f94

Upload 12 files

Browse files

Files changed (12) hide show

models/MDX_Net_Models/model_data/mdx_c_configs/model1.yaml +34 -0
models/MDX_Net_Models/model_data/mdx_c_configs/model2.yaml +34 -0
models/MDX_Net_Models/model_data/mdx_c_configs/model3.yaml +34 -0
models/MDX_Net_Models/model_data/mdx_c_configs/modelA.yaml +39 -0
models/MDX_Net_Models/model_data/mdx_c_configs/modelB.yaml +41 -0
models/MDX_Net_Models/model_data/mdx_c_configs/model_2_stem_061321.yaml +36 -0
models/MDX_Net_Models/model_data/mdx_c_configs/model_2_stem_full_band.yaml +36 -0
models/MDX_Net_Models/model_data/mdx_c_configs/model_2_stem_full_band_2.yaml +36 -0
models/MDX_Net_Models/model_data/mdx_c_configs/model_2_stem_full_band_3.yaml +39 -0
models/MDX_Net_Models/model_data/mdx_c_configs/model_2_stem_full_band_4.yaml +40 -0
models/MDX_Net_Models/model_data/mdx_c_configs/model_2_stem_full_band_8k.yaml +43 -0
models/MDX_Net_Models/model_data/mdx_c_configs/sndfx.yaml +41 -0

models/MDX_Net_Models/model_data/mdx_c_configs/model1.yaml ADDED Viewed

	@@ -0,0 +1,34 @@

+audio:  # model1.yaml, audio section; NOTE(review): key meanings are set by the loader, which is not shown here
+  chunk_size: 260096  # equals hop_length * (dim_t - 1) = 2048 * 127
+  dim_f: 4096  # equals n_fft / 2
+  dim_t: 128  # NOTE(review): inference.dim_t below is 256 — confirm which one the consumer reads
+  hop_length: 2048
+  n_fft: 8192
+  num_channels: 2  # presumably stereo — TODO confirm
+  sample_rate: 44100
+model:
+  act: gelu
+  bottleneck_factor: 4
+  growth: 64
+  norm: InstanceNorm
+  num_blocks_per_scale: 2
+  num_channels: 128  # separate key from audio.num_channels (2)
+  num_scales: 5
+  num_subbands: 4
+  scale:  # two-element list
+  - 2
+  - 2
+training:
+  batch_size: 8
+  grad_clip: 0  # NOTE(review): other configs in this commit use null here — confirm 0 and null are treated alike
+  instruments:  # four entries
+  - Vocals
+  - Drums
+  - Bass
+  - Other
+  lr: 5.0e-05
+  target_instrument: null  # null while four instruments are listed above
+inference:
+  batch_size: 1
+  dim_t: 256  # twice audio.dim_t (128)
+  num_overlap: 8

models/MDX_Net_Models/model_data/mdx_c_configs/model2.yaml ADDED Viewed

	@@ -0,0 +1,34 @@

+audio:  # model2.yaml, audio section; NOTE(review): key meanings are set by the loader, which is not shown here
+  chunk_size: 260096  # equals hop_length * (dim_t - 1) = 2048 * 127
+  dim_f: 4096  # equals n_fft / 2
+  dim_t: 128  # NOTE(review): inference.dim_t below is 256 — confirm which one the consumer reads
+  hop_length: 2048
+  n_fft: 8192
+  num_channels: 2  # presumably stereo — TODO confirm
+  sample_rate: 44100
+model:
+  act: gelu
+  bottleneck_factor: 4
+  growth: 64
+  norm: InstanceNorm
+  num_blocks_per_scale: 2
+  num_channels: 256  # separate key from audio.num_channels (2)
+  num_scales: 5
+  num_subbands: 4
+  scale:  # two-element list
+  - 2
+  - 2
+training:
+  batch_size: 8
+  grad_clip: 0  # NOTE(review): other configs in this commit use null here — confirm 0 and null are treated alike
+  instruments:  # four entries
+  - Vocals
+  - Drums
+  - Bass
+  - Other
+  lr: 3.0e-05
+  target_instrument: null  # null while four instruments are listed above
+inference:
+  batch_size: 1
+  dim_t: 256  # twice audio.dim_t (128)
+  num_overlap: 8

models/MDX_Net_Models/model_data/mdx_c_configs/model3.yaml ADDED Viewed

	@@ -0,0 +1,34 @@

+audio:  # model3.yaml, audio section; NOTE(review): key meanings are set by the loader, which is not shown here
+  chunk_size: 260096  # equals hop_length * (dim_t - 1) = 2048 * 127
+  dim_f: 4096  # equals n_fft / 3 here (12288 / 3), not n_fft / 2
+  dim_t: 128  # NOTE(review): inference.dim_t below is 256 — confirm which one the consumer reads
+  hop_length: 2048
+  n_fft: 12288
+  num_channels: 2  # presumably stereo — TODO confirm
+  sample_rate: 44100
+model:
+  act: gelu
+  bottleneck_factor: 4
+  growth: 64
+  norm: InstanceNorm
+  num_blocks_per_scale: 2
+  num_channels: 128  # separate key from audio.num_channels (2)
+  num_scales: 5
+  num_subbands: 4
+  scale:  # two-element list
+  - 2
+  - 2
+training:
+  batch_size: 8
+  grad_clip: 0  # NOTE(review): other configs in this commit use null here — confirm 0 and null are treated alike
+  instruments:  # four entries
+  - Vocals
+  - Drums
+  - Bass
+  - Other
+  lr: 5.0e-05
+  target_instrument: Vocals  # set to one of the listed instruments rather than null
+inference:
+  batch_size: 1
+  dim_t: 256  # twice audio.dim_t (128)
+  num_overlap: 8

models/MDX_Net_Models/model_data/mdx_c_configs/modelA.yaml ADDED Viewed

	@@ -0,0 +1,39 @@

+audio:  # modelA.yaml, audio section; NOTE(review): key meanings are set by the loader, which is not shown here
+  chunk_size: 261120  # equals hop_length * (dim_t - 1) = 1024 * 255
+  dim_f: 4096  # equals n_fft / 2
+  dim_t: 256  # same value as inference.dim_t below
+  hop_length: 1024
+  min_mean_abs: 0.01
+  n_fft: 8192
+  num_channels: 2  # presumably stereo — TODO confirm
+  sample_rate: 44100
+model:
+  act: gelu
+  bottleneck_factor: 4
+  growth: 64
+  norm: InstanceNorm
+  num_blocks_per_scale: 2
+  num_channels: 64  # separate key from audio.num_channels (2)
+  num_scales: 5
+  num_subbands: 4
+  scale:  # two-element list
+  - 2
+  - 2
+training:
+  batch_size: 6
+  coarse_loss_clip: true
+  ema_momentum: 0.999
+  grad_clip: null  # NOTE(review): several other configs in this commit use 0 here — confirm 0 and null are treated alike
+  instruments:  # four entries
+  - Vocals
+  - Drums
+  - Bass
+  - Other
+  lr: 0.0001
+  num_steps: 100000
+  q: 0.4  # NOTE(review): meaning of q is not visible in this file — see consumer
+  target_instrument: null  # null while four instruments are listed above
+inference:
+  batch_size: 2
+  dim_t: 256
+  num_overlap: 8

models/MDX_Net_Models/model_data/mdx_c_configs/modelB.yaml ADDED Viewed

	@@ -0,0 +1,41 @@

+audio:  # modelB.yaml, audio section; NOTE(review): key meanings are set by the loader, which is not shown here
+  chunk_size: 261120  # equals hop_length * (dim_t - 1) = 1024 * 255
+  dim_f: 4096  # equals n_fft / 2
+  dim_t: 256  # same value as inference.dim_t below
+  hop_length: 1024
+  min_mean_abs: 0.01
+  n_fft: 8192
+  num_channels: 2  # presumably stereo — TODO confirm
+  sample_rate: 44100
+model:
+  act: gelu
+  bottleneck_factor: 4
+  growth: 64
+  norm: InstanceNorm
+  num_blocks_per_scale: 2
+  num_channels: 64  # separate key from audio.num_channels (2)
+  num_scales: 5
+  num_subbands: 4
+  scale:  # two-element list
+  - 2
+  - 2
+training:
+  batch_size: 6
+  coarse_loss_clip: false
+  datasets:  # single-entry list
+  - ../data/moises/bleeding
+  ema_momentum: 0.999
+  grad_clip: null  # NOTE(review): several other configs in this commit use 0 here — confirm 0 and null are treated alike
+  instruments:  # four entries
+  - Vocals
+  - Drums
+  - Bass
+  - Other
+  lr: 0.0001
+  num_steps: 150000
+  q: 0.93  # NOTE(review): meaning of q is not visible in this file — see consumer
+  target_instrument: null  # null while four instruments are listed above
+inference:
+  batch_size: 2
+  dim_t: 256
+  num_overlap: 8

models/MDX_Net_Models/model_data/mdx_c_configs/model_2_stem_061321.yaml ADDED Viewed

	@@ -0,0 +1,36 @@

+audio:  # model_2_stem_061321.yaml, audio section; NOTE(review): key meanings are set by the loader, which is not shown here
+  chunk_size: 260096  # equals 2048 * 127; NOTE(review): hop_length * (dim_t - 1) with dim_t 256 would be 522240 — confirm intended
+  dim_f: 4096  # equals n_fft / 3 here (12288 / 3), not n_fft / 2
+  dim_t: 256  # same value as inference.dim_t below
+  hop_length: 2048
+  n_fft: 12288
+  num_channels: 2  # presumably stereo — TODO confirm
+  sample_rate: 44100
+  min_mean_abs: 0.001
+model:
+  act: gelu
+  bottleneck_factor: 4
+  growth: 64
+  norm: InstanceNorm
+  num_blocks_per_scale: 2
+  num_channels: 128  # separate key from audio.num_channels (2)
+  num_scales: 5
+  num_subbands: 4
+  scale:  # two-element list
+  - 2
+  - 2
+  name: epoch_10.ckpt  # NOTE(review): looks like a checkpoint file name — confirm how the consumer uses it
+training:
+  batch_size: 16
+  grad_clip: 0  # NOTE(review): other configs in this commit use null here — confirm 0 and null are treated alike
+  instruments:  # two entries
+  - Vocals
+  - Instrumental
+  lr: 5.0e-05
+  target_instrument: null  # null while two instruments are listed above
+  num_epochs: 100
+  num_steps: 1000
+inference:
+  batch_size: 1
+  dim_t: 256
+  num_overlap: 8

models/MDX_Net_Models/model_data/mdx_c_configs/model_2_stem_full_band.yaml ADDED Viewed

	@@ -0,0 +1,36 @@

+audio:  # model_2_stem_full_band.yaml, audio section; NOTE(review): key meanings are set by the loader, which is not shown here
+  chunk_size: 260096  # equals hop_length * (dim_t - 1) = 2048 * 127
+  dim_f: 6144  # equals n_fft / 2
+  dim_t: 128  # NOTE(review): inference.dim_t below is 256 — confirm which one the consumer reads
+  hop_length: 2048
+  n_fft: 12288
+  num_channels: 2  # presumably stereo — TODO confirm
+  sample_rate: 44100
+  min_mean_abs: 0.001
+model:
+  act: gelu
+  bottleneck_factor: 4
+  growth: 64
+  norm: InstanceNorm
+  num_blocks_per_scale: 2
+  num_channels: 128  # separate key from audio.num_channels (2)
+  num_scales: 5
+  num_subbands: 6
+  scale:  # two-element list
+  - 2
+  - 2
+training:
+  batch_size: 14
+  grad_clip: 0  # NOTE(review): other configs in this commit use null here — confirm 0 and null are treated alike
+  instruments:  # two entries
+  - Vocals
+  - Instrumental
+  lr: 3.0e-05
+  target_instrument: null  # null while two instruments are listed above
+  num_epochs: 1000
+  num_steps: 1000
+  augmentation: 1  # integer 1, not a YAML boolean
+inference:
+  batch_size: 1
+  dim_t: 256  # twice audio.dim_t (128)
+  num_overlap: 8

models/MDX_Net_Models/model_data/mdx_c_configs/model_2_stem_full_band_2.yaml ADDED Viewed

	@@ -0,0 +1,36 @@

+audio:  # model_2_stem_full_band_2.yaml, audio section; NOTE(review): key meanings are set by the loader, which is not shown here
+  chunk_size: 260096  # equals hop_length * (dim_t - 1) = 2048 * 127
+  dim_f: 6144  # equals n_fft / 2
+  dim_t: 128  # NOTE(review): inference.dim_t below is 256 — confirm which one the consumer reads
+  hop_length: 2048
+  n_fft: 12288
+  num_channels: 2  # presumably stereo — TODO confirm
+  sample_rate: 44100
+  min_mean_abs: 0.001
+model:
+  act: gelu
+  bottleneck_factor: 4
+  growth: 128
+  norm: InstanceNorm
+  num_blocks_per_scale: 2
+  num_channels: 128  # separate key from audio.num_channels (2)
+  num_scales: 5
+  num_subbands: 6
+  scale:  # two-element list
+  - 2
+  - 2
+training:
+  batch_size: 14
+  grad_clip: 0  # NOTE(review): other configs in this commit use null here — confirm 0 and null are treated alike
+  instruments:  # two entries
+  - Vocals
+  - Instrumental
+  lr: 2.0e-05
+  target_instrument: null  # null while two instruments are listed above
+  num_epochs: 1000
+  num_steps: 1000
+  augmentation: 1  # integer 1, not a YAML boolean
+inference:
+  batch_size: 1
+  dim_t: 256  # twice audio.dim_t (128)
+  num_overlap: 8

models/MDX_Net_Models/model_data/mdx_c_configs/model_2_stem_full_band_3.yaml ADDED Viewed

	@@ -0,0 +1,39 @@

+audio:  # model_2_stem_full_band_3.yaml, audio section; NOTE(review): key meanings are set by the loader, which is not shown here
+  chunk_size: 261120  # equals hop_length * (dim_t - 1) = 1024 * 255
+  dim_f: 6144  # equals n_fft / 2
+  dim_t: 256  # same value as inference.dim_t below
+  hop_length: 1024
+  n_fft: 12288
+  num_channels: 2  # presumably stereo — TODO confirm
+  sample_rate: 44100
+  min_mean_abs: 0.001
+model:
+  act: gelu
+  bottleneck_factor: 4
+  growth: 128
+  norm: InstanceNorm
+  num_blocks_per_scale: 2
+  num_channels: 128  # separate key from audio.num_channels (2)
+  num_scales: 5
+  num_subbands: 6
+  scale:  # two-element list
+  - 2
+  - 2
+training:
+  batch_size: 6
+  grad_clip: 0  # NOTE(review): other configs in this commit use null here — confirm 0 and null are treated alike
+  instruments:  # two entries
+  - Vocals
+  - Instrumental
+  lr: 1.0e-05
+  target_instrument: null  # null while two instruments are listed above
+  num_epochs: 1000
+  num_steps: 1000
+  augmentation: 1  # integer 1, not a YAML boolean
+  q: 0.95  # NOTE(review): meaning of q is not visible in this file — see consumer
+  coarse_loss_clip: true
+  ema_momentum: 0.999
+inference:
+  batch_size: 1
+  dim_t: 256
+  num_overlap: 8

models/MDX_Net_Models/model_data/mdx_c_configs/model_2_stem_full_band_4.yaml ADDED Viewed

	@@ -0,0 +1,40 @@

+audio:  # model_2_stem_full_band_4.yaml, audio section; NOTE(review): key meanings are set by the loader, which is not shown here
+  chunk_size: 261120  # equals hop_length * (dim_t - 1) = 1024 * 255
+  dim_f: 6144  # equals n_fft / 2
+  dim_t: 256  # same value as inference.dim_t below
+  hop_length: 1024
+  n_fft: 12288
+  num_channels: 2  # presumably stereo — TODO confirm
+  sample_rate: 44100
+  min_mean_abs: 0.001
+model:
+  act: gelu
+  bottleneck_factor: 4
+  growth: 128
+  norm: InstanceNorm
+  num_blocks_per_scale: 2
+  num_channels: 128  # separate key from audio.num_channels (2)
+  num_scales: 5
+  num_subbands: 6
+  scale:  # two-element list
+  - 2
+  - 2
+training:
+  batch_size: 6
+  grad_clip: 0  # NOTE(review): other configs in this commit use null here — confirm 0 and null are treated alike
+  instruments:  # two entries
+  - Vocals
+  - Instrumental
+  lr: 0.7e-05  # numerically 7.0e-06; mantissa is not normalized like the other configs' lr values
+  patience: 2
+  target_instrument: null  # null while two instruments are listed above
+  num_epochs: 1000
+  num_steps: 1000
+  augmentation: 1  # integer 1, not a YAML boolean
+  q: 0.95  # NOTE(review): meaning of q is not visible in this file — see consumer
+  coarse_loss_clip: true
+  ema_momentum: 0.999
+inference:
+  batch_size: 1
+  dim_t: 256
+  num_overlap: 8

models/MDX_Net_Models/model_data/mdx_c_configs/model_2_stem_full_band_8k.yaml ADDED Viewed

	@@ -0,0 +1,43 @@

+audio:  # model_2_stem_full_band_8k.yaml, audio section; NOTE(review): key meanings are set by the loader, which is not shown here
+  chunk_size: 261120  # equals hop_length * (dim_t - 1) = 1024 * 255
+  dim_f: 4096  # equals n_fft / 2
+  dim_t: 256  # same value as inference.dim_t below
+  hop_length: 1024
+  n_fft: 8192
+  num_channels: 2  # presumably stereo — TODO confirm
+  sample_rate: 44100
+  min_mean_abs: 0.001
+model:
+  act: gelu
+  bottleneck_factor: 4
+  growth: 128
+  norm: InstanceNorm
+  num_blocks_per_scale: 2
+  num_channels: 128  # separate key from audio.num_channels (2)
+  num_scales: 5
+  num_subbands: 4
+  scale:  # two-element list
+  - 2
+  - 2
+training:
+  batch_size: 6
+  grad_clip: 0  # NOTE(review): other configs in this commit use null here — confirm 0 and null are treated alike
+  instruments:  # two entries
+  - Vocals
+  - Instrumental
+  lr: 1.0e-05
+  patience: 2
+  reduce_factor: 0.95
+  target_instrument: null  # null while two instruments are listed above
+  num_epochs: 1000
+  num_steps: 1000
+  augmentation: 1  # integer 1, not a YAML boolean
+  augmentation_type: simple1
+  augmentation_mix: true
+  q: 0.95  # NOTE(review): meaning of q is not visible in this file — see consumer
+  coarse_loss_clip: true
+  ema_momentum: 0.999
+inference:
+  batch_size: 1
+  dim_t: 256
+  num_overlap: 8

models/MDX_Net_Models/model_data/mdx_c_configs/sndfx.yaml ADDED Viewed

	@@ -0,0 +1,41 @@

+audio:  # sndfx.yaml, audio section; NOTE(review): key meanings are set by the loader, which is not shown here
+  chunk_size: 261120  # equals hop_length * (dim_t - 1) = 1024 * 255
+  dim_f: 1024  # equals n_fft / 2
+  dim_t: 256  # same value as inference.dim_t below
+  hop_length: 1024
+  min_mean_abs: 0.01
+  n_fft: 2048
+  num_channels: 2  # presumably stereo — TODO confirm
+  sample_rate: 44100
+  stereo_prob: 0.7
+model:
+  act: gelu
+  bottleneck_factor: 4
+  growth: 64
+  norm: InstanceNorm
+  num_blocks_per_scale: 2
+  num_channels: 64  # separate key from audio.num_channels (2)
+  num_scales: 5
+  num_subbands: 4
+  scale:  # two-element list
+  - 2
+  - 2
+training:
+  batch_size: 8
+  ema_momentum: 0.999
+  grad_clip: null  # NOTE(review): several other configs in this commit use 0 here — confirm 0 and null are treated alike
+  instruments:  # three entries; inference.instruments below uses different names
+  - Music
+  - Speech
+  - SFX
+  lr: 0.0001
+  num_steps: 30000
+  target_instrument: null  # null while three instruments are listed above
+inference:
+  batch_size: 8
+  dim_t: 256
+  instruments:  # NOTE(review): Music/Dialog/Effect here vs Music/Speech/SFX under training — confirm the mismatch is intended
+  - Music
+  - Dialog
+  - Effect
+  num_overlap: 8