sanchit-gandhi HF staff committed on
Commit
16bdf08
1 Parent(s): d8cc55c

End of training

Browse files
Files changed (5) hide show
  1. README.md +7 -1
  2. all_results.json +12 -5
  3. eval_results.json +10 -0
  4. train_results.json +5 -5
  5. trainer_state.json +48 -48
README.md CHANGED
@@ -2,6 +2,8 @@
2
  license: cc-by-nc-4.0
3
  library_name: peft
4
  tags:
 
 
5
  - generated_from_trainer
6
  base_model: facebook/musicgen-melody-large
7
  model-index:
@@ -16,7 +18,11 @@ should probably proofread and complete it, then remove this comment. -->
16
  [<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="200" height="32"/>](https://wandb.ai/sanchit-gandhi/black-eyed-peas/runs/8ycxnynu)
17
  # black-eyed-peas-v1-crafted-prompt-3-epochs
18
 
19
- This model is a fine-tuned version of [facebook/musicgen-melody-large](https://huggingface.co/facebook/musicgen-melody-large) on an unknown dataset.
 
 
 
 
20
 
21
  ## Model description
22
 
 
2
  license: cc-by-nc-4.0
3
  library_name: peft
4
  tags:
5
+ - text-to-audio
6
+ - sweet-dreambooths/black-eyed-peas-v1
7
  - generated_from_trainer
8
  base_model: facebook/musicgen-melody-large
9
  model-index:
 
18
  [<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="200" height="32"/>](https://wandb.ai/sanchit-gandhi/black-eyed-peas/runs/8ycxnynu)
19
  # black-eyed-peas-v1-crafted-prompt-3-epochs
20
 
21
+ This model is a fine-tuned version of [facebook/musicgen-melody-large](https://huggingface.co/facebook/musicgen-melody-large) on the sweet-dreambooths/black-eyed-peas-v1 dataset (default configuration).
22
+ It achieves the following results on the evaluation set:
23
+ - Loss: 3.0997
24
+ - Text Cosine Sim: 0.4173
25
+ - Audio Cosine Sim: 0.6327
26
 
27
  ## Model description
28
 
all_results.json CHANGED
@@ -1,9 +1,16 @@
1
  {
2
  "epoch": 2.6879999999999997,
3
- "total_flos": 231798834079728.0,
4
- "train_loss": 9.752382596333822,
5
- "train_runtime": 1792.9741,
 
 
 
 
 
 
 
6
  "train_samples": 125,
7
- "train_samples_per_second": 0.209,
8
- "train_steps_per_second": 0.012
9
  }
 
1
  {
2
  "epoch": 2.6879999999999997,
3
+ "eval_audio_cosine_sim": 0.632674515247345,
4
+ "eval_loss": 3.0996882915496826,
5
+ "eval_runtime": 2067.9427,
6
+ "eval_samples": 12,
7
+ "eval_samples_per_second": 0.006,
8
+ "eval_steps_per_second": 0.006,
9
+ "eval_text_cosine_sim": 0.4172757863998413,
10
+ "total_flos": 284409215227248.0,
11
+ "train_loss": 9.75504275730678,
12
+ "train_runtime": 2860.8048,
13
  "train_samples": 125,
14
+ "train_samples_per_second": 0.131,
15
+ "train_steps_per_second": 0.007
16
  }
eval_results.json ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 2.6879999999999997,
3
+ "eval_audio_cosine_sim": 0.632674515247345,
4
+ "eval_loss": 3.0996882915496826,
5
+ "eval_runtime": 2067.9427,
6
+ "eval_samples": 12,
7
+ "eval_samples_per_second": 0.006,
8
+ "eval_steps_per_second": 0.006,
9
+ "eval_text_cosine_sim": 0.4172757863998413
10
+ }
train_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "epoch": 2.6879999999999997,
3
- "total_flos": 231798834079728.0,
4
- "train_loss": 9.752382596333822,
5
- "train_runtime": 1792.9741,
6
  "train_samples": 125,
7
- "train_samples_per_second": 0.209,
8
- "train_steps_per_second": 0.012
9
  }
 
1
  {
2
  "epoch": 2.6879999999999997,
3
+ "total_flos": 284409215227248.0,
4
+ "train_loss": 9.75504275730678,
5
+ "train_runtime": 2860.8048,
6
  "train_samples": 125,
7
+ "train_samples_per_second": 0.131,
8
+ "train_steps_per_second": 0.007
9
  }
trainer_state.json CHANGED
@@ -10,159 +10,159 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.128,
13
- "grad_norm": 1.7382475137710571,
14
  "learning_rate": 2.857142857142857e-05,
15
- "loss": 10.1861,
16
  "step": 1
17
  },
18
  {
19
  "epoch": 0.256,
20
- "grad_norm": 1.5424667596817017,
21
  "learning_rate": 2.7142857142857144e-05,
22
- "loss": 10.0983,
23
  "step": 2
24
  },
25
  {
26
  "epoch": 0.384,
27
- "grad_norm": 1.8689937591552734,
28
  "learning_rate": 2.5714285714285714e-05,
29
- "loss": 10.133,
30
  "step": 3
31
  },
32
  {
33
  "epoch": 0.512,
34
- "grad_norm": 1.9022722244262695,
35
  "learning_rate": 2.4285714285714288e-05,
36
- "loss": 10.0471,
37
  "step": 4
38
  },
39
  {
40
  "epoch": 0.64,
41
- "grad_norm": 2.0458884239196777,
42
  "learning_rate": 2.2857142857142858e-05,
43
- "loss": 9.9922,
44
  "step": 5
45
  },
46
  {
47
  "epoch": 0.768,
48
- "grad_norm": 2.3358101844787598,
49
  "learning_rate": 2.1428571428571428e-05,
50
- "loss": 10.0411,
51
  "step": 6
52
  },
53
  {
54
  "epoch": 0.896,
55
- "grad_norm": 2.354118585586548,
56
  "learning_rate": 1.9999999999999998e-05,
57
- "loss": 10.0344,
58
  "step": 7
59
  },
60
  {
61
  "epoch": 1.024,
62
- "grad_norm": 2.3863983154296875,
63
  "learning_rate": 1.8571428571428572e-05,
64
- "loss": 9.9137,
65
  "step": 8
66
  },
67
  {
68
  "epoch": 1.152,
69
- "grad_norm": 2.524012804031372,
70
  "learning_rate": 1.7142857142857142e-05,
71
- "loss": 9.8263,
72
  "step": 9
73
  },
74
  {
75
  "epoch": 1.28,
76
- "grad_norm": 2.6917295455932617,
77
  "learning_rate": 1.5714285714285715e-05,
78
- "loss": 9.7679,
79
  "step": 10
80
  },
81
  {
82
  "epoch": 1.408,
83
- "grad_norm": 2.6992530822753906,
84
  "learning_rate": 1.4285714285714285e-05,
85
- "loss": 9.6647,
86
  "step": 11
87
  },
88
  {
89
  "epoch": 1.536,
90
- "grad_norm": 2.9822065830230713,
91
  "learning_rate": 1.2857142857142857e-05,
92
- "loss": 9.6447,
93
  "step": 12
94
  },
95
  {
96
  "epoch": 1.6640000000000001,
97
- "grad_norm": 3.070004463195801,
98
  "learning_rate": 1.1428571428571429e-05,
99
- "loss": 9.6797,
100
  "step": 13
101
  },
102
  {
103
  "epoch": 1.792,
104
- "grad_norm": 3.1922192573547363,
105
  "learning_rate": 9.999999999999999e-06,
106
- "loss": 9.5573,
107
  "step": 14
108
  },
109
  {
110
  "epoch": 1.92,
111
- "grad_norm": 3.1647372245788574,
112
  "learning_rate": 8.571428571428571e-06,
113
- "loss": 9.5216,
114
  "step": 15
115
  },
116
  {
117
  "epoch": 2.048,
118
- "grad_norm": 3.2566683292388916,
119
  "learning_rate": 7.142857142857143e-06,
120
- "loss": 9.5464,
121
  "step": 16
122
  },
123
  {
124
  "epoch": 2.176,
125
- "grad_norm": 3.1021530628204346,
126
  "learning_rate": 5.7142857142857145e-06,
127
- "loss": 9.4385,
128
  "step": 17
129
  },
130
  {
131
  "epoch": 2.304,
132
- "grad_norm": 3.345439910888672,
133
  "learning_rate": 4.2857142857142855e-06,
134
- "loss": 9.4269,
135
  "step": 18
136
  },
137
  {
138
  "epoch": 2.432,
139
- "grad_norm": 3.5849218368530273,
140
  "learning_rate": 2.8571428571428573e-06,
141
- "loss": 9.4999,
142
  "step": 19
143
  },
144
  {
145
  "epoch": 2.56,
146
- "grad_norm": 3.8040404319763184,
147
  "learning_rate": 1.4285714285714286e-06,
148
- "loss": 9.44,
149
  "step": 20
150
  },
151
  {
152
  "epoch": 2.6879999999999997,
153
- "grad_norm": 3.2971229553222656,
154
  "learning_rate": 0.0,
155
- "loss": 9.3401,
156
  "step": 21
157
  },
158
  {
159
  "epoch": 2.6879999999999997,
160
  "step": 21,
161
- "total_flos": 231798834079728.0,
162
- "train_loss": 9.752382596333822,
163
- "train_runtime": 1792.9741,
164
- "train_samples_per_second": 0.209,
165
- "train_steps_per_second": 0.012
166
  }
167
  ],
168
  "logging_steps": 1.0,
@@ -182,7 +182,7 @@
182
  "attributes": {}
183
  }
184
  },
185
- "total_flos": 231798834079728.0,
186
  "train_batch_size": 1,
187
  "trial_name": null,
188
  "trial_params": null
 
10
  "log_history": [
11
  {
12
  "epoch": 0.128,
13
+ "grad_norm": 1.7210274934768677,
14
  "learning_rate": 2.857142857142857e-05,
15
+ "loss": 10.176,
16
  "step": 1
17
  },
18
  {
19
  "epoch": 0.256,
20
+ "grad_norm": 1.5320605039596558,
21
  "learning_rate": 2.7142857142857144e-05,
22
+ "loss": 10.1016,
23
  "step": 2
24
  },
25
  {
26
  "epoch": 0.384,
27
+ "grad_norm": 1.87909734249115,
28
  "learning_rate": 2.5714285714285714e-05,
29
+ "loss": 10.1459,
30
  "step": 3
31
  },
32
  {
33
  "epoch": 0.512,
34
+ "grad_norm": 1.8966753482818604,
35
  "learning_rate": 2.4285714285714288e-05,
36
+ "loss": 10.0505,
37
  "step": 4
38
  },
39
  {
40
  "epoch": 0.64,
41
+ "grad_norm": 2.0056731700897217,
42
  "learning_rate": 2.2857142857142858e-05,
43
+ "loss": 9.9816,
44
  "step": 5
45
  },
46
  {
47
  "epoch": 0.768,
48
+ "grad_norm": 2.313743829727173,
49
  "learning_rate": 2.1428571428571428e-05,
50
+ "loss": 10.0497,
51
  "step": 6
52
  },
53
  {
54
  "epoch": 0.896,
55
+ "grad_norm": 2.3521242141723633,
56
  "learning_rate": 1.9999999999999998e-05,
57
+ "loss": 10.0357,
58
  "step": 7
59
  },
60
  {
61
  "epoch": 1.024,
62
+ "grad_norm": 2.3931469917297363,
63
  "learning_rate": 1.8571428571428572e-05,
64
+ "loss": 9.918,
65
  "step": 8
66
  },
67
  {
68
  "epoch": 1.152,
69
+ "grad_norm": 2.519587516784668,
70
  "learning_rate": 1.7142857142857142e-05,
71
+ "loss": 9.8211,
72
  "step": 9
73
  },
74
  {
75
  "epoch": 1.28,
76
+ "grad_norm": 2.6767983436584473,
77
  "learning_rate": 1.5714285714285715e-05,
78
+ "loss": 9.7817,
79
  "step": 10
80
  },
81
  {
82
  "epoch": 1.408,
83
+ "grad_norm": 2.6999528408050537,
84
  "learning_rate": 1.4285714285714285e-05,
85
+ "loss": 9.6886,
86
  "step": 11
87
  },
88
  {
89
  "epoch": 1.536,
90
+ "grad_norm": 3.005337953567505,
91
  "learning_rate": 1.2857142857142857e-05,
92
+ "loss": 9.6439,
93
  "step": 12
94
  },
95
  {
96
  "epoch": 1.6640000000000001,
97
+ "grad_norm": 3.042705774307251,
98
  "learning_rate": 1.1428571428571429e-05,
99
+ "loss": 9.6661,
100
  "step": 13
101
  },
102
  {
103
  "epoch": 1.792,
104
+ "grad_norm": 3.1823525428771973,
105
  "learning_rate": 9.999999999999999e-06,
106
+ "loss": 9.5694,
107
  "step": 14
108
  },
109
  {
110
  "epoch": 1.92,
111
+ "grad_norm": 3.1568336486816406,
112
  "learning_rate": 8.571428571428571e-06,
113
+ "loss": 9.5277,
114
  "step": 15
115
  },
116
  {
117
  "epoch": 2.048,
118
+ "grad_norm": 3.230482339859009,
119
  "learning_rate": 7.142857142857143e-06,
120
+ "loss": 9.5726,
121
  "step": 16
122
  },
123
  {
124
  "epoch": 2.176,
125
+ "grad_norm": 3.065131425857544,
126
  "learning_rate": 5.7142857142857145e-06,
127
+ "loss": 9.4275,
128
  "step": 17
129
  },
130
  {
131
  "epoch": 2.304,
132
+ "grad_norm": 3.3117969036102295,
133
  "learning_rate": 4.2857142857142855e-06,
134
+ "loss": 9.4209,
135
  "step": 18
136
  },
137
  {
138
  "epoch": 2.432,
139
+ "grad_norm": 3.5407657623291016,
140
  "learning_rate": 2.8571428571428573e-06,
141
+ "loss": 9.4978,
142
  "step": 19
143
  },
144
  {
145
  "epoch": 2.56,
146
+ "grad_norm": 3.7619757652282715,
147
  "learning_rate": 1.4285714285714286e-06,
148
+ "loss": 9.4477,
149
  "step": 20
150
  },
151
  {
152
  "epoch": 2.6879999999999997,
153
+ "grad_norm": 3.2933194637298584,
154
  "learning_rate": 0.0,
155
+ "loss": 9.3319,
156
  "step": 21
157
  },
158
  {
159
  "epoch": 2.6879999999999997,
160
  "step": 21,
161
+ "total_flos": 284409215227248.0,
162
+ "train_loss": 9.75504275730678,
163
+ "train_runtime": 2860.8048,
164
+ "train_samples_per_second": 0.131,
165
+ "train_steps_per_second": 0.007
166
  }
167
  ],
168
  "logging_steps": 1.0,
 
182
  "attributes": {}
183
  }
184
  },
185
+ "total_flos": 284409215227248.0,
186
  "train_batch_size": 1,
187
  "trial_name": null,
188
  "trial_params": null