# coverhunter_finetune.yaml
---
# Model settings for the `coverhunter_finetune` configuration.
# NOTE(review): the code that consumes this file is not visible here, so the
# per-key notes below are inferred from key names only — confirm each one
# against the loader before relying on it.
model:
  name: coverhunter_finetune
  # Presumably the dimensionality of the output embedding — TODO confirm.
  embed_dim: 256
  # channels / se_channels / res2net_scale / num_blocks look like
  # ECAPA-TDNN-style backbone hyperparameters — verify against the model code.
  channels: 512
  se_channels: 128
  res2net_scale: 8
  num_blocks: 3
  # Presumably the number of mel bands the model expects as input; the
  # spectrogram parameters themselves live under `data` — TODO confirm.
  n_mels: 128
  # Presumably the margin (m) and scale (s) of an additive-angular-margin
  # classification head — TODO confirm.
  aam_m: 0.2
  aam_s: 30.0
  # band_split_channels is set although use_band_split is false; presumably
  # it is ignored while the feature is disabled — confirm.
  use_band_split: false
  band_split_channels: 128
  # All three branch switches are enabled in this configuration.
  use_dual_stream: true
  mert_melody_branch: true
  ecapa_branch: true
  # Presumably attention-head count and layer count of the CoverHunter
  # module — TODO confirm.
  coverhunter_heads: 8
  coverhunter_layers: 4
  fusion_hidden_dim: 256
  # Looks like a Hugging Face Hub model id.
  # NOTE(review): the public model card for this checkpoint appears to specify
  # 24 kHz input audio, while data.sample_rate in this file is 16000 — confirm
  # that the MERT branch resamples its input.
  mert_model_name: m-a-p/MERT-v1-95M

# Audio loading and cropping settings.
# NOTE(review): units below are inferred from key names — confirm against the
# data pipeline.
data:
  # Presumably in Hz.
  sample_rate: 16000
  # Presumably STFT window size and hop size in samples; if so, a hop of 160
  # at 16000 Hz corresponds to 10 ms per frame — TODO confirm.
  n_fft: 512
  hop_length: 160
  # Presumably the length of each training segment in seconds — TODO confirm.
  segment_dur: 8.0
  # Presumably how many segments are cropped from each song — TODO confirm.
  crop_per_song: 6

# Optimisation, loss-weighting and sampling settings for the fine-tuning run.
# NOTE(review): the training loop is not visible here; the notes below are
# inferred from key names — confirm against the trainer.
training:
  batch_size: 16
  epochs: 30
  lr: 0.0002
  weight_decay: 0.0001
  # Presumably the number of initial epochs with learning-rate warm-up.
  warmup_epochs: 3
  # Presumably the temperature of the contrastive loss — TODO confirm.
  temperature: 0.05
  # Presumably the relative weights of the supervised-contrastive and AAM
  # loss terms — TODO confirm.
  supcon_weight: 1.0
  aam_weight: 0.2
  mixed_precision: true
  # Presumably the maximum gradient norm used for clipping — TODO confirm.
  gradient_clip: 1.0
  # NOTE(review): the unit (epochs vs. steps) of save_every and log_every is
  # not stated in this file — confirm.
  save_every: 5
  log_every: 10
  # Presumably the number of hard negatives mined per anchor — TODO confirm.
  hard_negative_k: 4
  # Both weight maps use the same four keys. The values here are integers
  # while pair_type_weights uses floats — confirm the difference is intended.
  sample_type_weights:
    default: 1
    compressed: 2
    recording: 3
    environment: 4
  pair_type_weights:
    default: 1.0
    compressed: 1.5
    recording: 2.0
    environment: 3.0