MVSEP-MDX23-music-separation-model

Running

Yeluo0204 committed on Nov 4, 2024

Commit

c9fe986

verified ·

1 Parent(s): 0af3599

Upload 6 files

Files changed (5) hide show

models/MDX23C-8KFFT-InstVoc_HQ.ckpt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:49d51472769e34a2501cd1da782346a3212555c3a5619fc2c53507445528d816
+size 448101203

models/UVR-MDX-NET-Voc_FT.onnx ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:534b2070fcc7df514b13ef660dc8cbb328679c2374d04354a5c42bb14ecce111
+size 66762490

models/UVR_MDX_Instr_HQ3.onnx ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:317554b07fe1ea5279a77f2b1520a41ea4b93432560c4ffd08792c30fddf9adc
+size 66759214

models/model_2_stem_061321.yaml ADDED Viewed

+audio:
+  chunk_size: 260096
+  dim_f: 4096
+  dim_t: 256
+  hop_length: 2048
+  n_fft: 12288
+  num_channels: 2
+  sample_rate: 44100
+  min_mean_abs: 0.001
+model:
+  act: gelu
+  bottleneck_factor: 4
+  growth: 64
+  norm: InstanceNorm
+  num_blocks_per_scale: 2
+  num_channels: 128
+  num_scales: 5
+  num_subbands: 4
+  scale:
+  - 2
+  - 2
+  name: epoch_10.ckpt
+training:
+  batch_size: 16
+  grad_clip: 0
+  instruments:
+  - Vocals
+  - Instrumental
+  lr: 5.0e-05
+  target_instrument: null
+  num_epochs: 100
+  num_steps: 1000
+inference:
+  batch_size: 1
+  dim_t: 256
+  num_overlap: 8

models/model_2_stem_full_band_8k.yaml ADDED Viewed

+audio:
+  chunk_size: 261120
+  dim_f: 4096
+  dim_t: 256
+  hop_length: 1024
+  n_fft: 8192
+  num_channels: 2
+  sample_rate: 44100
+  min_mean_abs: 0.001
+model:
+  act: gelu
+  bottleneck_factor: 4
+  growth: 128
+  norm: InstanceNorm
+  num_blocks_per_scale: 2
+  num_channels: 128
+  num_scales: 5
+  num_subbands: 4
+  scale:
+  - 2
+  - 2
+training:
+  batch_size: 6
+  grad_clip: 0
+  instruments:
+  - Vocals
+  - Instrumental
+  lr: 1.0e-05
+  patience: 2
+  reduce_factor: 0.95
+  target_instrument: null
+  num_epochs: 1000
+  num_steps: 1000
+  augmentation: 1
+  augmentation_type: simple1
+  augmentation_mix: true
+  q: 0.95
+  coarse_loss_clip: true
+  ema_momentum: 0.999
+inference:
+  batch_size: 1
+  dim_t: 256
+  num_overlap: 8