sanchit-gandhi HF staff committed on
Commit
d8cc55c
1 Parent(s): 170f60f

Model save

Browse files
README.md CHANGED
@@ -12,8 +12,8 @@ model-index:
12
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
13
  should probably proofread and complete it, then remove this comment. -->
14
 
15
- [<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="200" height="32"/>](https://wandb.ai/sanchit-gandhi/black-eyed-peas/runs/b8se0vmo)
16
- [<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="200" height="32"/>](https://wandb.ai/sanchit-gandhi/black-eyed-peas/runs/b8se0vmo)
17
  # black-eyed-peas-v1-crafted-prompt-3-epochs
18
 
19
  This model is a fine-tuned version of [facebook/musicgen-melody-large](https://huggingface.co/facebook/musicgen-melody-large) on an unknown dataset.
 
12
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
13
  should probably proofread and complete it, then remove this comment. -->
14
 
15
+ [<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="200" height="32"/>](https://wandb.ai/sanchit-gandhi/black-eyed-peas/runs/8ycxnynu)
16
+ [<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="200" height="32"/>](https://wandb.ai/sanchit-gandhi/black-eyed-peas/runs/8ycxnynu)
17
  # black-eyed-peas-v1-crafted-prompt-3-epochs
18
 
19
  This model is a fine-tuned version of [facebook/musicgen-melody-large](https://huggingface.co/facebook/musicgen-melody-large) on an unknown dataset.
adapter_config.json CHANGED
@@ -23,22 +23,22 @@
23
  "rank_pattern": {},
24
  "revision": null,
25
  "target_modules": [
26
- "lm_heads.3",
27
- "enc_to_dec_proj",
28
- "lm_heads.0",
29
  "embed_tokens.1",
30
- "k_proj",
 
 
31
  "embed_tokens.3",
 
 
32
  "v_proj",
33
- "lm_heads.2",
34
- "fc2",
35
  "audio_enc_to_dec_proj",
36
- "embed_tokens.2",
37
- "q_proj",
38
- "lm_heads.1",
39
  "out_proj",
40
- "fc1",
41
- "embed_tokens.0"
 
 
42
  ],
43
  "task_type": null,
44
  "use_dora": false,
 
23
  "rank_pattern": {},
24
  "revision": null,
25
  "target_modules": [
 
 
 
26
  "embed_tokens.1",
27
+ "lm_heads.1",
28
+ "fc2",
29
+ "embed_tokens.0",
30
  "embed_tokens.3",
31
+ "lm_heads.0",
32
+ "lm_heads.3",
33
  "v_proj",
34
+ "k_proj",
 
35
  "audio_enc_to_dec_proj",
36
+ "lm_heads.2",
 
 
37
  "out_proj",
38
+ "q_proj",
39
+ "enc_to_dec_proj",
40
+ "embed_tokens.2",
41
+ "fc1"
42
  ],
43
  "task_type": null,
44
  "use_dora": false,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:93a31e252da2fa281a7232cb2bc46a7c0fc4409debe64ffbb49f233b9907354b
3
  size 115742888
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca435ac5d88714516cc5070507273d647419f9efdd8bcb64d7b743b32d2c6f15
3
  size 115742888
all_results.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 2.6879999999999997,
3
+ "total_flos": 231798834079728.0,
4
+ "train_loss": 9.752382596333822,
5
+ "train_runtime": 1792.9741,
6
+ "train_samples": 125,
7
+ "train_samples_per_second": 0.209,
8
+ "train_steps_per_second": 0.012
9
+ }
train_results.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 2.6879999999999997,
3
+ "total_flos": 231798834079728.0,
4
+ "train_loss": 9.752382596333822,
5
+ "train_runtime": 1792.9741,
6
+ "train_samples": 125,
7
+ "train_samples_per_second": 0.209,
8
+ "train_steps_per_second": 0.012
9
+ }
trainer_state.json ADDED
@@ -0,0 +1,189 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": null,
3
+ "best_model_checkpoint": null,
4
+ "epoch": 2.6879999999999997,
5
+ "eval_steps": 30,
6
+ "global_step": 21,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 0.128,
13
+ "grad_norm": 1.7382475137710571,
14
+ "learning_rate": 2.857142857142857e-05,
15
+ "loss": 10.1861,
16
+ "step": 1
17
+ },
18
+ {
19
+ "epoch": 0.256,
20
+ "grad_norm": 1.5424667596817017,
21
+ "learning_rate": 2.7142857142857144e-05,
22
+ "loss": 10.0983,
23
+ "step": 2
24
+ },
25
+ {
26
+ "epoch": 0.384,
27
+ "grad_norm": 1.8689937591552734,
28
+ "learning_rate": 2.5714285714285714e-05,
29
+ "loss": 10.133,
30
+ "step": 3
31
+ },
32
+ {
33
+ "epoch": 0.512,
34
+ "grad_norm": 1.9022722244262695,
35
+ "learning_rate": 2.4285714285714288e-05,
36
+ "loss": 10.0471,
37
+ "step": 4
38
+ },
39
+ {
40
+ "epoch": 0.64,
41
+ "grad_norm": 2.0458884239196777,
42
+ "learning_rate": 2.2857142857142858e-05,
43
+ "loss": 9.9922,
44
+ "step": 5
45
+ },
46
+ {
47
+ "epoch": 0.768,
48
+ "grad_norm": 2.3358101844787598,
49
+ "learning_rate": 2.1428571428571428e-05,
50
+ "loss": 10.0411,
51
+ "step": 6
52
+ },
53
+ {
54
+ "epoch": 0.896,
55
+ "grad_norm": 2.354118585586548,
56
+ "learning_rate": 1.9999999999999998e-05,
57
+ "loss": 10.0344,
58
+ "step": 7
59
+ },
60
+ {
61
+ "epoch": 1.024,
62
+ "grad_norm": 2.3863983154296875,
63
+ "learning_rate": 1.8571428571428572e-05,
64
+ "loss": 9.9137,
65
+ "step": 8
66
+ },
67
+ {
68
+ "epoch": 1.152,
69
+ "grad_norm": 2.524012804031372,
70
+ "learning_rate": 1.7142857142857142e-05,
71
+ "loss": 9.8263,
72
+ "step": 9
73
+ },
74
+ {
75
+ "epoch": 1.28,
76
+ "grad_norm": 2.6917295455932617,
77
+ "learning_rate": 1.5714285714285715e-05,
78
+ "loss": 9.7679,
79
+ "step": 10
80
+ },
81
+ {
82
+ "epoch": 1.408,
83
+ "grad_norm": 2.6992530822753906,
84
+ "learning_rate": 1.4285714285714285e-05,
85
+ "loss": 9.6647,
86
+ "step": 11
87
+ },
88
+ {
89
+ "epoch": 1.536,
90
+ "grad_norm": 2.9822065830230713,
91
+ "learning_rate": 1.2857142857142857e-05,
92
+ "loss": 9.6447,
93
+ "step": 12
94
+ },
95
+ {
96
+ "epoch": 1.6640000000000001,
97
+ "grad_norm": 3.070004463195801,
98
+ "learning_rate": 1.1428571428571429e-05,
99
+ "loss": 9.6797,
100
+ "step": 13
101
+ },
102
+ {
103
+ "epoch": 1.792,
104
+ "grad_norm": 3.1922192573547363,
105
+ "learning_rate": 9.999999999999999e-06,
106
+ "loss": 9.5573,
107
+ "step": 14
108
+ },
109
+ {
110
+ "epoch": 1.92,
111
+ "grad_norm": 3.1647372245788574,
112
+ "learning_rate": 8.571428571428571e-06,
113
+ "loss": 9.5216,
114
+ "step": 15
115
+ },
116
+ {
117
+ "epoch": 2.048,
118
+ "grad_norm": 3.2566683292388916,
119
+ "learning_rate": 7.142857142857143e-06,
120
+ "loss": 9.5464,
121
+ "step": 16
122
+ },
123
+ {
124
+ "epoch": 2.176,
125
+ "grad_norm": 3.1021530628204346,
126
+ "learning_rate": 5.7142857142857145e-06,
127
+ "loss": 9.4385,
128
+ "step": 17
129
+ },
130
+ {
131
+ "epoch": 2.304,
132
+ "grad_norm": 3.345439910888672,
133
+ "learning_rate": 4.2857142857142855e-06,
134
+ "loss": 9.4269,
135
+ "step": 18
136
+ },
137
+ {
138
+ "epoch": 2.432,
139
+ "grad_norm": 3.5849218368530273,
140
+ "learning_rate": 2.8571428571428573e-06,
141
+ "loss": 9.4999,
142
+ "step": 19
143
+ },
144
+ {
145
+ "epoch": 2.56,
146
+ "grad_norm": 3.8040404319763184,
147
+ "learning_rate": 1.4285714285714286e-06,
148
+ "loss": 9.44,
149
+ "step": 20
150
+ },
151
+ {
152
+ "epoch": 2.6879999999999997,
153
+ "grad_norm": 3.2971229553222656,
154
+ "learning_rate": 0.0,
155
+ "loss": 9.3401,
156
+ "step": 21
157
+ },
158
+ {
159
+ "epoch": 2.6879999999999997,
160
+ "step": 21,
161
+ "total_flos": 231798834079728.0,
162
+ "train_loss": 9.752382596333822,
163
+ "train_runtime": 1792.9741,
164
+ "train_samples_per_second": 0.209,
165
+ "train_steps_per_second": 0.012
166
+ }
167
+ ],
168
+ "logging_steps": 1.0,
169
+ "max_steps": 21,
170
+ "num_input_tokens_seen": 0,
171
+ "num_train_epochs": 3,
172
+ "save_steps": 500,
173
+ "stateful_callbacks": {
174
+ "TrainerControl": {
175
+ "args": {
176
+ "should_epoch_stop": false,
177
+ "should_evaluate": false,
178
+ "should_log": false,
179
+ "should_save": false,
180
+ "should_training_stop": false
181
+ },
182
+ "attributes": {}
183
+ }
184
+ },
185
+ "total_flos": 231798834079728.0,
186
+ "train_batch_size": 1,
187
+ "trial_name": null,
188
+ "trial_params": null
189
+ }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:53ce71f30a1d77dc920e747b594dbf3462090ccf044984d2de31fdba1edd5120
3
  size 5368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f6742ea29acfe8964c1d78aabaa63ecf56038b4206fa71f2d9cb1d5768f6ea8
3
  size 5368