# coverhunter_finetune.yaml
# Model settings for the "coverhunter_finetune" configuration.
# All keys in this section are children of `model` and must stay indented by
# two spaces; at column 0 they would become top-level keys and `model` itself
# would load as null.
model:
  name: coverhunter_finetune
  embed_dim: 256
  channels: 512
  se_channels: 128
  res2net_scale: 8
  num_blocks: 3
  n_mels: 128
  # NOTE(review): aam_m / aam_s look like the margin and scale of an
  # additive-angular-margin loss — confirm against the loss implementation.
  aam_m: 0.2
  aam_s: 30.0
  # band_split_channels is set even though use_band_split is false;
  # presumably it is ignored while the feature is disabled — verify.
  use_band_split: false
  band_split_channels: 128
  use_dual_stream: true
  mert_melody_branch: true
  ecapa_branch: true
  coverhunter_heads: 8
  coverhunter_layers: 4
  fusion_hidden_dim: 256
  # NOTE(review): looks like a model-hub identifier — confirm how it is resolved.
  mert_model_name: m-a-p/MERT-v1-95M
# Audio input settings.
# All keys in this section are children of `data` and must stay indented by
# two spaces; at column 0 they would become top-level keys and `data` itself
# would load as null.
data:
  sample_rate: 16000
  n_fft: 512
  # NOTE(review): if hop_length is in samples, 160 / 16000 = 10 ms per frame —
  # confirm the unit with the feature extractor.
  hop_length: 160
  # presumably seconds — TODO confirm
  segment_dur: 8.0
  crop_per_song: 6
# Optimisation and sampling settings.
# All keys in this section are children of `training`. The two *_type_weights
# maps are nested one level deeper: both use the same four keys (default,
# compressed, recording, environment), so flattening them would create
# duplicate keys and one map would silently overwrite the other.
training:
  batch_size: 16
  epochs: 30
  lr: 0.0002
  weight_decay: 0.0001
  warmup_epochs: 3
  temperature: 0.05
  # NOTE(review): supcon_weight / aam_weight look like per-loss weighting
  # factors — confirm how the trainer combines them.
  supcon_weight: 1.0
  aam_weight: 0.2
  mixed_precision: true
  gradient_clip: 1.0
  # presumably counted in epochs (save_every) and steps (log_every) — verify
  save_every: 5
  log_every: 10
  hard_negative_k: 4
  # Per-type weights written as integers.
  sample_type_weights:
    default: 1
    compressed: 2
    recording: 3
    environment: 4
  # Per-type weights written as floats; same key set as sample_type_weights.
  pair_type_weights:
    default: 1.0
    compressed: 1.5
    recording: 2.0
    environment: 3.0