ylacombe HF staff committed on
Commit
053f8fb
1 Parent(s): c616dd7

End of training

Browse files
Files changed (4) hide show
  1. README.md +4 -1
  2. all_results.json +5 -5
  3. train_results.json +5 -5
  4. trainer_state.json +76 -22
README.md CHANGED
@@ -1,5 +1,8 @@
1
  ---
 
2
  tags:
 
 
3
  - generated_from_trainer
4
  datasets:
5
  - audiofolder
@@ -13,7 +16,7 @@ should probably proofread and complete it, then remove this comment. -->
13
 
14
  # musicgen-melody-bella-ciao
15
 
16
- This model is a fine-tuned version of [](https://huggingface.co/) on the audiofolder dataset.
17
 
18
  ## Model description
19
 
 
1
  ---
2
+ base_model: ylacombe/musicgen-melody
3
  tags:
4
+ - text-to-audio
5
+ - patrickvonplaten/bella_ciao
6
  - generated_from_trainer
7
  datasets:
8
  - audiofolder
 
16
 
17
  # musicgen-melody-bella-ciao
18
 
19
+ This model is a fine-tuned version of [ylacombe/musicgen-melody](https://huggingface.co/ylacombe/musicgen-melody) on the PATRICKVONPLATEN/BELLA_CIAO - DEFAULT dataset.
20
 
21
  ## Model description
22
 
all_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 10.0,
3
- "train_loss": 7.140205179850261,
4
- "train_runtime": 114.8228,
5
  "train_samples": 30,
6
- "train_samples_per_second": 2.613,
7
- "train_steps_per_second": 1.306
8
  }
 
1
  {
2
+ "epoch": 25.0,
3
+ "train_loss": 7.2796097819010415,
4
+ "train_runtime": 437.882,
5
  "train_samples": 30,
6
+ "train_samples_per_second": 1.713,
7
+ "train_steps_per_second": 0.856
8
  }
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 10.0,
3
- "train_loss": 7.140205179850261,
4
- "train_runtime": 114.8228,
5
  "train_samples": 30,
6
- "train_samples_per_second": 2.613,
7
- "train_steps_per_second": 1.306
8
  }
 
1
  {
2
+ "epoch": 25.0,
3
+ "train_loss": 7.2796097819010415,
4
+ "train_runtime": 437.882,
5
  "train_samples": 30,
6
+ "train_samples_per_second": 1.713,
7
+ "train_steps_per_second": 0.856
8
  }
trainer_state.json CHANGED
@@ -1,63 +1,117 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 10.0,
5
  "eval_steps": 1000,
6
- "global_step": 150,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
  "epoch": 1.67,
13
- "learning_rate": 8.333333333333334e-06,
14
- "loss": 7.5038,
15
  "step": 25
16
  },
17
  {
18
  "epoch": 3.33,
19
- "learning_rate": 6.666666666666667e-06,
20
- "loss": 7.1421,
21
  "step": 50
22
  },
23
  {
24
  "epoch": 5.0,
25
- "learning_rate": 5e-06,
26
- "loss": 7.1034,
27
  "step": 75
28
  },
29
  {
30
  "epoch": 6.67,
31
- "learning_rate": 3.3333333333333333e-06,
32
- "loss": 7.0666,
33
  "step": 100
34
  },
35
  {
36
  "epoch": 8.33,
37
- "learning_rate": 1.6666666666666667e-06,
38
- "loss": 7.0238,
39
  "step": 125
40
  },
41
  {
42
  "epoch": 10.0,
43
- "learning_rate": 0.0,
44
- "loss": 7.0015,
45
  "step": 150
46
  },
47
  {
48
- "epoch": 10.0,
49
- "step": 150,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
50
  "total_flos": 0.0,
51
- "train_loss": 7.140205179850261,
52
- "train_runtime": 114.8228,
53
- "train_samples_per_second": 2.613,
54
- "train_steps_per_second": 1.306
55
  }
56
  ],
57
  "logging_steps": 25,
58
- "max_steps": 150,
59
  "num_input_tokens_seen": 0,
60
- "num_train_epochs": 10,
61
  "save_steps": 500,
62
  "total_flos": 0.0,
63
  "train_batch_size": 2,
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 25.0,
5
  "eval_steps": 1000,
6
+ "global_step": 375,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
  "epoch": 1.67,
13
+ "learning_rate": 9.36e-07,
14
+ "loss": 8.5683,
15
  "step": 25
16
  },
17
  {
18
  "epoch": 3.33,
19
+ "learning_rate": 8.693333333333333e-07,
20
+ "loss": 7.5028,
21
  "step": 50
22
  },
23
  {
24
  "epoch": 5.0,
25
+ "learning_rate": 8.026666666666667e-07,
26
+ "loss": 7.293,
27
  "step": 75
28
  },
29
  {
30
  "epoch": 6.67,
31
+ "learning_rate": 7.359999999999999e-07,
32
+ "loss": 7.2316,
33
  "step": 100
34
  },
35
  {
36
  "epoch": 8.33,
37
+ "learning_rate": 6.693333333333333e-07,
38
+ "loss": 7.1945,
39
  "step": 125
40
  },
41
  {
42
  "epoch": 10.0,
43
+ "learning_rate": 6.026666666666667e-07,
44
+ "loss": 7.178,
45
  "step": 150
46
  },
47
  {
48
+ "epoch": 11.67,
49
+ "learning_rate": 5.36e-07,
50
+ "loss": 7.176,
51
+ "step": 175
52
+ },
53
+ {
54
+ "epoch": 13.33,
55
+ "learning_rate": 4.693333333333333e-07,
56
+ "loss": 7.1478,
57
+ "step": 200
58
+ },
59
+ {
60
+ "epoch": 15.0,
61
+ "learning_rate": 4.0799999999999995e-07,
62
+ "loss": 7.1358,
63
+ "step": 225
64
+ },
65
+ {
66
+ "epoch": 16.67,
67
+ "learning_rate": 3.413333333333333e-07,
68
+ "loss": 7.154,
69
+ "step": 250
70
+ },
71
+ {
72
+ "epoch": 18.33,
73
+ "learning_rate": 2.7466666666666664e-07,
74
+ "loss": 7.1035,
75
+ "step": 275
76
+ },
77
+ {
78
+ "epoch": 20.0,
79
+ "learning_rate": 2.0799999999999998e-07,
80
+ "loss": 7.1441,
81
+ "step": 300
82
+ },
83
+ {
84
+ "epoch": 21.67,
85
+ "learning_rate": 1.4133333333333333e-07,
86
+ "loss": 7.1239,
87
+ "step": 325
88
+ },
89
+ {
90
+ "epoch": 23.33,
91
+ "learning_rate": 7.466666666666667e-08,
92
+ "loss": 7.1274,
93
+ "step": 350
94
+ },
95
+ {
96
+ "epoch": 25.0,
97
+ "learning_rate": 8e-09,
98
+ "loss": 7.1136,
99
+ "step": 375
100
+ },
101
+ {
102
+ "epoch": 25.0,
103
+ "step": 375,
104
  "total_flos": 0.0,
105
+ "train_loss": 7.2796097819010415,
106
+ "train_runtime": 437.882,
107
+ "train_samples_per_second": 1.713,
108
+ "train_steps_per_second": 0.856
109
  }
110
  ],
111
  "logging_steps": 25,
112
+ "max_steps": 375,
113
  "num_input_tokens_seen": 0,
114
+ "num_train_epochs": 25,
115
  "save_steps": 500,
116
  "total_flos": 0.0,
117
  "train_batch_size": 2,