ylacombe HF staff committed on
Commit
f2a9eda
1 Parent(s): e033a3e

End of training

Browse files
Files changed (4) hide show
  1. README.md +4 -1
  2. all_results.json +5 -5
  3. train_results.json +5 -5
  4. trainer_state.json +19 -67
README.md CHANGED
@@ -1,5 +1,8 @@
1
  ---
 
2
  tags:
 
 
3
  - generated_from_trainer
4
  datasets:
5
  - audiofolder
@@ -13,7 +16,7 @@ should probably proofread and complete it, then remove this comment. -->
13
 
14
  # musicgen-melody-bella-ciao
15
 
16
- This model is a fine-tuned version of [](https://huggingface.co/) on the audiofolder dataset.
17
 
18
  ## Model description
19
 
 
1
  ---
2
+ base_model: ylacombe/musicgen-melody
3
  tags:
4
+ - text-to-audio
5
+ - patrickvonplaten/bella_ciao
6
  - generated_from_trainer
7
  datasets:
8
  - audiofolder
 
16
 
17
  # musicgen-melody-bella-ciao
18
 
19
+ This model is a fine-tuned version of [ylacombe/musicgen-melody](https://huggingface.co/ylacombe/musicgen-melody) on the PATRICKVONPLATEN/BELLA_CIAO - DEFAULT dataset.
20
 
21
  ## Model description
22
 
all_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 10.0,
3
- "train_loss": 7.3888854471842444,
4
- "train_runtime": 149.4092,
5
- "train_samples": 30,
6
- "train_samples_per_second": 2.008,
7
- "train_steps_per_second": 2.008
8
  }
 
1
  {
2
  "epoch": 10.0,
3
+ "train_loss": 8.267948303222656,
4
+ "train_runtime": 72.315,
5
+ "train_samples": 10,
6
+ "train_samples_per_second": 1.383,
7
+ "train_steps_per_second": 1.383
8
  }
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 10.0,
3
- "train_loss": 7.3888854471842444,
4
- "train_runtime": 149.4092,
5
- "train_samples": 30,
6
- "train_samples_per_second": 2.008,
7
- "train_steps_per_second": 2.008
8
  }
 
1
  {
2
  "epoch": 10.0,
3
+ "train_loss": 8.267948303222656,
4
+ "train_runtime": 72.315,
5
+ "train_samples": 10,
6
+ "train_samples_per_second": 1.383,
7
+ "train_steps_per_second": 1.383
8
  }
trainer_state.json CHANGED
@@ -3,95 +3,47 @@
3
  "best_model_checkpoint": null,
4
  "epoch": 10.0,
5
  "eval_steps": 1000,
6
- "global_step": 300,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
- {
12
- "epoch": 0.83,
13
- "learning_rate": 9.2e-07,
14
- "loss": 8.7857,
15
- "step": 25
16
- },
17
- {
18
- "epoch": 1.67,
19
- "learning_rate": 8.366666666666667e-07,
20
- "loss": 7.6115,
21
- "step": 50
22
- },
23
  {
24
  "epoch": 2.5,
25
- "learning_rate": 7.533333333333332e-07,
26
- "loss": 7.3706,
27
- "step": 75
28
- },
29
- {
30
- "epoch": 3.33,
31
- "learning_rate": 6.733333333333333e-07,
32
- "loss": 7.2883,
33
- "step": 100
34
- },
35
- {
36
- "epoch": 4.17,
37
- "learning_rate": 5.9e-07,
38
- "loss": 7.2673,
39
- "step": 125
40
  },
41
  {
42
  "epoch": 5.0,
43
- "learning_rate": 5.066666666666667e-07,
44
- "loss": 7.2174,
45
- "step": 150
46
- },
47
- {
48
- "epoch": 5.83,
49
- "learning_rate": 4.2333333333333334e-07,
50
- "loss": 7.2089,
51
- "step": 175
52
- },
53
- {
54
- "epoch": 6.67,
55
- "learning_rate": 3.4000000000000003e-07,
56
- "loss": 7.1989,
57
- "step": 200
58
  },
59
  {
60
  "epoch": 7.5,
61
- "learning_rate": 2.5666666666666666e-07,
62
- "loss": 7.1801,
63
- "step": 225
64
- },
65
- {
66
- "epoch": 8.33,
67
- "learning_rate": 1.7333333333333332e-07,
68
- "loss": 7.1842,
69
- "step": 250
70
- },
71
- {
72
- "epoch": 9.17,
73
- "learning_rate": 9e-08,
74
- "loss": 7.1852,
75
- "step": 275
76
  },
77
  {
78
  "epoch": 10.0,
79
- "learning_rate": 1e-08,
80
- "loss": 7.1686,
81
- "step": 300
82
  },
83
  {
84
  "epoch": 10.0,
85
- "step": 300,
86
  "total_flos": 0.0,
87
- "train_loss": 7.3888854471842444,
88
- "train_runtime": 149.4092,
89
- "train_samples_per_second": 2.008,
90
- "train_steps_per_second": 2.008
91
  }
92
  ],
93
  "logging_steps": 25,
94
- "max_steps": 300,
95
  "num_input_tokens_seen": 0,
96
  "num_train_epochs": 10,
97
  "save_steps": 500,
 
3
  "best_model_checkpoint": null,
4
  "epoch": 10.0,
5
  "eval_steps": 1000,
6
+ "global_step": 100,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
 
 
 
 
 
 
 
 
 
 
 
 
11
  {
12
  "epoch": 2.5,
13
+ "learning_rate": 3.7999999999999996e-07,
14
+ "loss": 9.1576,
15
+ "step": 25
 
 
 
 
 
 
 
 
 
 
 
 
16
  },
17
  {
18
  "epoch": 5.0,
19
+ "learning_rate": 2.55e-07,
20
+ "loss": 8.3016,
21
+ "step": 50
 
 
 
 
 
 
 
 
 
 
 
 
22
  },
23
  {
24
  "epoch": 7.5,
25
+ "learning_rate": 1.3e-07,
26
+ "loss": 7.9075,
27
+ "step": 75
 
 
 
 
 
 
 
 
 
 
 
 
28
  },
29
  {
30
  "epoch": 10.0,
31
+ "learning_rate": 5e-09,
32
+ "loss": 7.7051,
33
+ "step": 100
34
  },
35
  {
36
  "epoch": 10.0,
37
+ "step": 100,
38
  "total_flos": 0.0,
39
+ "train_loss": 8.267948303222656,
40
+ "train_runtime": 72.315,
41
+ "train_samples_per_second": 1.383,
42
+ "train_steps_per_second": 1.383
43
  }
44
  ],
45
  "logging_steps": 25,
46
+ "max_steps": 100,
47
  "num_input_tokens_seen": 0,
48
  "num_train_epochs": 10,
49
  "save_steps": 500,