# coverhunter_finetune_4gb.yaml
# Model architecture settings. Only the values are defined here; how each key
# is interpreted is up to the consuming code, which is not visible in this file.
# Notes marked "presumably" are inferred from key names - confirm before
# relying on them.
model:
  # Profile identifier; "lowmem" suggests a reduced-memory variant (assumption).
  name: coverhunter_finetune_lowmem
  # Presumably the length of the final embedding vector.
  embed_dim: 192
  # channels / se_channels / res2net_scale / num_blocks: presumably sizing for
  # the ECAPA-style branch toggled by ecapa_branch below - TODO confirm.
  channels: 256
  se_channels: 64
  res2net_scale: 4
  num_blocks: 2
  # Number of mel bands. It is set under model rather than data, so the
  # feature extractor presumably reads it from here - verify against the loader.
  n_mels: 96
  # Presumably the margin (aam_m) and scale (aam_s) of an additive angular
  # margin head; training.aam_weight presumably weights its loss.
  aam_m: 0.2
  aam_s: 24.0
  # Band splitting is switched off; band_split_channels is still set and is
  # presumably ignored while use_band_split is false.
  use_band_split: false
  band_split_channels: 64
  # Feature toggles: all three are enabled in this profile.
  use_dual_stream: true
  mert_melody_branch: true
  ecapa_branch: true
  # Presumably the attention-head count and layer count of the CoverHunter
  # module - TODO confirm.
  coverhunter_heads: 4
  coverhunter_layers: 2
  # Presumably the hidden width of the layer that fuses the branches.
  fusion_hidden_dim: 128
  # Looks like a Hugging Face Hub model id (org/name form).
  # NOTE(review): the MERT-v1 model card lists 24 kHz input audio, while
  # data.sample_rate in this file is 16000 - confirm the MERT branch resamples.
  mert_model_name: m-a-p/MERT-v1-95M

# Audio front-end and cropping settings. Units are not stated in this file;
# the notes below assume Hz, samples and seconds - TODO confirm with the loader.
data:
  sample_rate: 16000
  # If in samples at sample_rate: 512 / 16000 = 32 ms analysis window.
  n_fft: 512
  # If in samples at sample_rate: 160 / 16000 = 10 ms hop (100 frames per second).
  hop_length: 160
  # If in seconds: 5.0 * 16000 = 80000 samples per segment.
  segment_dur: 5.0
  # Presumably the number of segments cropped from each song - verify.
  crop_per_song: 4

# Optimisation, loss and bookkeeping settings. The trainer that reads these
# keys is not visible here; notes marked "presumably" are inferred from key
# names and should be confirmed against it.
training:
  batch_size: 2
  epochs: 20
  # Equal to 1.5e-4; written in plain decimal form, which every YAML loader
  # reads as a float (exponent notation is parsed inconsistently).
  lr: 0.00015
  weight_decay: 0.0001
  # 2 of the 20 epochs; presumably a learning-rate warm-up phase.
  warmup_epochs: 2
  # Presumably the temperature of the contrastive (supcon) loss.
  temperature: 0.05
  # Presumably per-loss weights: the supervised-contrastive term at 1.0 and
  # the AAM term at 0.2 - confirm how the trainer combines them.
  supcon_weight: 1.0
  aam_weight: 0.2
  mixed_precision: true
  # Presumably a gradient clipping threshold (norm vs. value is not stated).
  gradient_clip: 1.0
  # Presumably a checkpoint interval and a logging interval; the units
  # (epochs or steps) are not stated here.
  save_every: 5
  log_every: 10
  # Presumably the number of hard negatives mined per anchor - verify.
  hard_negative_k: 2
  # Per-type weights. Both maps below use the same four keys, and both increase
  # in the order default < compressed < recording < environment.
  # sample_type_weights holds integers and pair_type_weights holds floats;
  # whether they act as sampling ratios or loss multipliers is not shown here.
  sample_type_weights:
    default: 1
    compressed: 2
    recording: 3
    environment: 4
  pair_type_weights:
    default: 1.0
    compressed: 1.4
    recording: 1.8
    environment: 2.2