lusciniaweldmou committed on
Commit
2b96093
1 Parent(s): 2eaafce

End of training

Browse files
Files changed (5) hide show
  1. README.md +6 -1
  2. all_results.json +11 -11
  3. eval_results.json +6 -6
  4. train_results.json +6 -6
  5. trainer_state.json +117 -33
README.md CHANGED
@@ -3,6 +3,8 @@ library_name: peft
3
  license: cc-by-nc-4.0
4
  base_model: facebook/musicgen-melody
5
  tags:
 
 
6
  - generated_from_trainer
7
  model-index:
8
  - name: musicgen-melody-lora-punk
@@ -14,7 +16,10 @@ should probably proofread and complete it, then remove this comment. -->
14
 
15
  # musicgen-melody-lora-punk
16
 
17
- This model is a fine-tuned version of [facebook/musicgen-melody](https://huggingface.co/facebook/musicgen-melody) on an unknown dataset.
 
 
 
18
 
19
  ## Model description
20
 
 
3
  license: cc-by-nc-4.0
4
  base_model: facebook/musicgen-melody
5
  tags:
6
+ - text-to-audio
7
+ - ylacombe/tiny-punk
8
  - generated_from_trainer
9
  model-index:
10
  - name: musicgen-melody-lora-punk
 
16
 
17
  # musicgen-melody-lora-punk
18
 
19
+ This model is a fine-tuned version of [facebook/musicgen-melody](https://huggingface.co/facebook/musicgen-melody) on the ylacombe/tiny-punk dataset (default configuration).
20
+ It achieves the following results on the evaluation set:
21
+ - Loss: 5.4128
22
+ - Clap: -0.0280
23
 
24
  ## Model description
25
 
all_results.json CHANGED
@@ -1,15 +1,15 @@
1
  {
2
- "epoch": 2.9411764705882355,
3
- "eval_clap": 0.033477772027254105,
4
- "eval_loss": 4.728214263916016,
5
- "eval_runtime": 135.5997,
6
  "eval_samples": 5,
7
- "eval_samples_per_second": 0.037,
8
- "eval_steps_per_second": 0.037,
9
- "total_flos": 2716162948296.0,
10
- "train_loss": 7.037385880947113,
11
- "train_runtime": 240.9049,
12
  "train_samples": 33,
13
- "train_samples_per_second": 0.548,
14
- "train_steps_per_second": 0.033
15
  }
 
1
  {
2
+ "epoch": 6.9411764705882355,
3
+ "eval_clap": -0.02799578569829464,
4
+ "eval_loss": 5.412776947021484,
5
+ "eval_runtime": 129.9186,
6
  "eval_samples": 5,
7
+ "eval_samples_per_second": 0.038,
8
+ "eval_steps_per_second": 0.038,
9
+ "total_flos": 6374668143960.0,
10
+ "train_loss": 5.936464631557465,
11
+ "train_runtime": 569.9677,
12
  "train_samples": 33,
13
+ "train_samples_per_second": 0.579,
14
+ "train_steps_per_second": 0.035
15
  }
eval_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "epoch": 2.9411764705882355,
3
- "eval_clap": 0.033477772027254105,
4
- "eval_loss": 4.728214263916016,
5
- "eval_runtime": 135.5997,
6
  "eval_samples": 5,
7
- "eval_samples_per_second": 0.037,
8
- "eval_steps_per_second": 0.037
9
  }
 
1
  {
2
+ "epoch": 6.9411764705882355,
3
+ "eval_clap": -0.02799578569829464,
4
+ "eval_loss": 5.412776947021484,
5
+ "eval_runtime": 129.9186,
6
  "eval_samples": 5,
7
+ "eval_samples_per_second": 0.038,
8
+ "eval_steps_per_second": 0.038
9
  }
train_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "epoch": 2.9411764705882355,
3
- "total_flos": 2716162948296.0,
4
- "train_loss": 7.037385880947113,
5
- "train_runtime": 240.9049,
6
  "train_samples": 33,
7
- "train_samples_per_second": 0.548,
8
- "train_steps_per_second": 0.033
9
  }
 
1
  {
2
+ "epoch": 6.9411764705882355,
3
+ "total_flos": 6374668143960.0,
4
+ "train_loss": 5.936464631557465,
5
+ "train_runtime": 569.9677,
6
  "train_samples": 33,
7
+ "train_samples_per_second": 0.579,
8
+ "train_steps_per_second": 0.035
9
  }
trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 2.9411764705882355,
5
  "eval_steps": 25,
6
- "global_step": 8,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -11,73 +11,157 @@
11
  {
12
  "epoch": 0.47058823529411764,
13
  "grad_norm": 1.2416200637817383,
14
- "learning_rate": 0.000175,
15
  "loss": 9.549,
16
  "step": 1
17
  },
18
  {
19
  "epoch": 0.9411764705882353,
20
- "grad_norm": 1.1443309783935547,
21
- "learning_rate": 0.00015000000000000001,
22
  "loss": 9.4063,
23
  "step": 2
24
  },
25
  {
26
  "epoch": 1.0,
27
- "grad_norm": 0.24926307797431946,
28
- "learning_rate": 0.000125,
29
- "loss": 1.1469,
30
  "step": 3
31
  },
32
  {
33
  "epoch": 1.4705882352941178,
34
- "grad_norm": 1.338173270225525,
35
- "learning_rate": 0.0001,
36
- "loss": 9.0306,
37
  "step": 4
38
  },
39
  {
40
  "epoch": 1.9411764705882353,
41
- "grad_norm": 1.4633773565292358,
42
- "learning_rate": 7.500000000000001e-05,
43
- "loss": 8.8971,
44
  "step": 5
45
  },
46
  {
47
  "epoch": 2.0,
48
- "grad_norm": 0.34096652269363403,
49
- "learning_rate": 5e-05,
50
- "loss": 1.0705,
51
  "step": 6
52
  },
53
  {
54
  "epoch": 2.4705882352941178,
55
- "grad_norm": 3.1844749450683594,
56
- "learning_rate": 2.5e-05,
57
- "loss": 8.6416,
58
  "step": 7
59
  },
60
  {
61
  "epoch": 2.9411764705882355,
62
- "grad_norm": 2.062983274459839,
63
- "learning_rate": 0.0,
64
- "loss": 8.5571,
65
  "step": 8
66
  },
67
  {
68
- "epoch": 2.9411764705882355,
69
- "step": 8,
70
- "total_flos": 2716162948296.0,
71
- "train_loss": 7.037385880947113,
72
- "train_runtime": 240.9049,
73
- "train_samples_per_second": 0.548,
74
- "train_steps_per_second": 0.033
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
75
  }
76
  ],
77
  "logging_steps": 1.0,
78
- "max_steps": 8,
79
  "num_input_tokens_seen": 0,
80
- "num_train_epochs": 4,
81
  "save_steps": 500,
82
  "stateful_callbacks": {
83
  "TrainerControl": {
@@ -91,7 +175,7 @@
91
  "attributes": {}
92
  }
93
  },
94
- "total_flos": 2716162948296.0,
95
  "train_batch_size": 2,
96
  "trial_name": null,
97
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 6.9411764705882355,
5
  "eval_steps": 25,
6
+ "global_step": 20,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
11
  {
12
  "epoch": 0.47058823529411764,
13
  "grad_norm": 1.2416200637817383,
14
+ "learning_rate": 0.00019,
15
  "loss": 9.549,
16
  "step": 1
17
  },
18
  {
19
  "epoch": 0.9411764705882353,
20
+ "grad_norm": 1.1442307233810425,
21
+ "learning_rate": 0.00018,
22
  "loss": 9.4063,
23
  "step": 2
24
  },
25
  {
26
  "epoch": 1.0,
27
+ "grad_norm": 0.243339404463768,
28
+ "learning_rate": 0.00017,
29
+ "loss": 1.1454,
30
  "step": 3
31
  },
32
  {
33
  "epoch": 1.4705882352941178,
34
+ "grad_norm": 1.3809175491333008,
35
+ "learning_rate": 0.00016,
36
+ "loss": 8.9806,
37
  "step": 4
38
  },
39
  {
40
  "epoch": 1.9411764705882353,
41
+ "grad_norm": 1.642061710357666,
42
+ "learning_rate": 0.00015000000000000001,
43
+ "loss": 8.7867,
44
  "step": 5
45
  },
46
  {
47
  "epoch": 2.0,
48
+ "grad_norm": 0.38183221220970154,
49
+ "learning_rate": 0.00014,
50
+ "loss": 1.0387,
51
  "step": 6
52
  },
53
  {
54
  "epoch": 2.4705882352941178,
55
+ "grad_norm": 2.3962018489837646,
56
+ "learning_rate": 0.00013000000000000002,
57
+ "loss": 8.2484,
58
  "step": 7
59
  },
60
  {
61
  "epoch": 2.9411764705882355,
62
+ "grad_norm": 2.1051485538482666,
63
+ "learning_rate": 0.00012,
64
+ "loss": 8.011,
65
  "step": 8
66
  },
67
  {
68
+ "epoch": 3.0,
69
+ "grad_norm": 0.2919195592403412,
70
+ "learning_rate": 0.00011000000000000002,
71
+ "loss": 0.9644,
72
+ "step": 9
73
+ },
74
+ {
75
+ "epoch": 3.4705882352941178,
76
+ "grad_norm": 1.3799338340759277,
77
+ "learning_rate": 0.0001,
78
+ "loss": 7.6546,
79
+ "step": 10
80
+ },
81
+ {
82
+ "epoch": 3.9411764705882355,
83
+ "grad_norm": 1.087898850440979,
84
+ "learning_rate": 9e-05,
85
+ "loss": 7.6277,
86
+ "step": 11
87
+ },
88
+ {
89
+ "epoch": 4.0,
90
+ "grad_norm": 0.2198086678981781,
91
+ "learning_rate": 8e-05,
92
+ "loss": 0.9398,
93
+ "step": 12
94
+ },
95
+ {
96
+ "epoch": 4.470588235294118,
97
+ "grad_norm": 0.8964143395423889,
98
+ "learning_rate": 7e-05,
99
+ "loss": 7.5336,
100
+ "step": 13
101
+ },
102
+ {
103
+ "epoch": 4.9411764705882355,
104
+ "grad_norm": 0.7436186671257019,
105
+ "learning_rate": 6e-05,
106
+ "loss": 7.4136,
107
+ "step": 14
108
+ },
109
+ {
110
+ "epoch": 5.0,
111
+ "grad_norm": 0.4537833034992218,
112
+ "learning_rate": 5e-05,
113
+ "loss": 0.9229,
114
+ "step": 15
115
+ },
116
+ {
117
+ "epoch": 5.470588235294118,
118
+ "grad_norm": 0.8003455996513367,
119
+ "learning_rate": 4e-05,
120
+ "loss": 7.3806,
121
+ "step": 16
122
+ },
123
+ {
124
+ "epoch": 5.9411764705882355,
125
+ "grad_norm": 0.8167087435722351,
126
+ "learning_rate": 3e-05,
127
+ "loss": 7.4289,
128
+ "step": 17
129
+ },
130
+ {
131
+ "epoch": 6.0,
132
+ "grad_norm": 0.3596856892108917,
133
+ "learning_rate": 2e-05,
134
+ "loss": 0.9533,
135
+ "step": 18
136
+ },
137
+ {
138
+ "epoch": 6.470588235294118,
139
+ "grad_norm": 0.9435980319976807,
140
+ "learning_rate": 1e-05,
141
+ "loss": 7.4254,
142
+ "step": 19
143
+ },
144
+ {
145
+ "epoch": 6.9411764705882355,
146
+ "grad_norm": 0.6535025835037231,
147
+ "learning_rate": 0.0,
148
+ "loss": 7.3186,
149
+ "step": 20
150
+ },
151
+ {
152
+ "epoch": 6.9411764705882355,
153
+ "step": 20,
154
+ "total_flos": 6374668143960.0,
155
+ "train_loss": 5.936464631557465,
156
+ "train_runtime": 569.9677,
157
+ "train_samples_per_second": 0.579,
158
+ "train_steps_per_second": 0.035
159
  }
160
  ],
161
  "logging_steps": 1.0,
162
+ "max_steps": 20,
163
  "num_input_tokens_seen": 0,
164
+ "num_train_epochs": 10,
165
  "save_steps": 500,
166
  "stateful_callbacks": {
167
  "TrainerControl": {
 
175
  "attributes": {}
176
  }
177
  },
178
+ "total_flos": 6374668143960.0,
179
  "train_batch_size": 2,
180
  "trial_name": null,
181
  "trial_params": null