English
music
emotion
kjysmu committed on
Commit
06db5b8
·
verified ·
1 Parent(s): 2c07aac

Upload 4 files

Browse files
config/base_config.yaml ADDED
@@ -0,0 +1,70 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ version: "1.34"
2
+
3
+ lr: 1e-4
4
+ log_step: 1
5
+ split: 0
6
+ batch_size: 8
7
+ sr: 16000
8
+
9
+ datasets:
10
+ - jamendo
11
+ - emomusic
12
+ - pmemo
13
+ - deam
14
+
15
+ model:
16
+ encoder: "MERT"
17
+ layers:
18
+ - 5
19
+ - 6
20
+ classifier: "linear-mt-attn-ck"
21
+ # - linear
22
+ # - linear-attn-ck
23
+ # - linear-mt-attn-ck
24
+
25
+ kd: True
26
+ kd_weight: 0.8
27
+ kd_temperature: 1
28
+ lr: 1e-4
29
+
30
+ dataset:
31
+ jamendo:
32
+ root: './dataset/jamendo'
33
+ subset: 'moodtheme'
34
+ batch_size: 8
35
+ output_size : 56
36
+ split: 0
37
+ segment_type: "all" # [all,f10s,f30s,10s,30s]
38
+ num_workers: 4
39
+ deam:
40
+ root: './dataset/deam'
41
+ batch_size: 8
42
+ output_size : 2
43
+ segment_type: "all" # [all,f10s,f30s,10s,30s]
44
+ num_workers: 4
45
+ pmemo:
46
+ root: './dataset/pmemo'
47
+ batch_size: 8
48
+ output_size : 2
49
+ segment_type: "all" # [all,f10s,f30s,10s,30s]
50
+ num_workers: 4
51
+ emomusic:
52
+ root: './dataset/emomusic'
53
+ batch_size: 8
54
+ output_size : 2
55
+ segment_type: "all" # [all,f10s,f30s,10s,30s]
56
+ num_workers: 4
57
+
58
+ # --------------------------------------- #
59
+ genre_class_size: 87
60
+ mood_class_size: 56
61
+ instr_class_size: 40
62
+ dac_latents_size: 72
63
+ dac_rvq_size: 9
64
+ # --------------------------------------- #
65
+
66
+ checkpoint_pmemo: "tb_logs/best/P.ckpt"
67
+ checkpoint_deam: "tb_logs/best/D.ckpt"
68
+ checkpoint_emomusic: "tb_logs/best/E.ckpt"
69
+ checkpoint_jamendo: "tb_logs/best/J.ckpt"
70
+
config/prep_config.yaml ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ device_id: 3
2
+
3
+ is_split: True
4
+ segment_duration: 30
5
+
6
+ dataset:
7
+ input_dir: '../dataset/deam/mp3'
8
+ output_dir: '../dataset/deam/mert_30s'
9
+
10
+ model:
11
+ name: 'm-a-p/MERT-v1-95M'
12
+ sr: 24000
13
+
14
+
15
+
16
+
config/test_config.yaml ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ defaults:
2
+ - base_config
3
+ - _self_
4
+
5
+ batch_size: 8
6
+ devices: [0]
7
+
8
+ trainer:
9
+ devices: ${devices}
10
+ accelerator: 'gpu'
11
+
12
+ checkpoint_latest: True
13
+
14
+ multitask: True
15
+ dataset_type: "va"
16
+ checkpoint: "tb_logs/best/J.ckpt"
config/train_config.yaml ADDED
@@ -0,0 +1,46 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ defaults:
2
+ - base_config
3
+ - _self_
4
+
5
+ devices: [0,1,2,3]
6
+ epochs: 500
7
+ batch_size: 8
8
+
9
+ monitor_metric: "val_loss"
10
+ monitor_metric_mood: "val_loss_mood"
11
+ monitor_metric_va: "val_loss_va"
12
+
13
+ checkpoint:
14
+ monitor: "${monitor_metric}"
15
+ filename: "{epoch:02d}-{${monitor_metric}:.4f}"
16
+ save_top_k: 5
17
+ mode: "min"
18
+ auto_insert_metric_name: False
19
+ save_last: True
20
+
21
+ checkpoint_mood:
22
+ monitor: "${monitor_metric_mood}"
23
+ filename: "mood-{epoch:02d}-{${monitor_metric_mood}:.4f}"
24
+ save_top_k: 5
25
+ mode: "min"
26
+ auto_insert_metric_name: False
27
+ save_last: True
28
+
29
+ checkpoint_va:
30
+ monitor: "${monitor_metric_va}"
31
+ filename: "va-{epoch:02d}-{${monitor_metric_va}:.4f}"
32
+ save_top_k: 5
33
+ mode: "min"
34
+ auto_insert_metric_name: False
35
+ save_last: True
36
+
37
+ earlystopping:
38
+ monitor: "${monitor_metric}"
39
+ patience: 10
40
+ min_delta: 0.0001
41
+ mode: "min"
42
+
43
+ trainer:
44
+ devices: ${devices}
45
+ max_epochs: ${epochs}
46
+ accelerator: 'gpu'