MeedoSam committed on
Commit
5a6aed9
1 Parent(s): 5a86835

Uploaded checkpoint-25000

Browse files
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1728956bca0b9356ae29462b37ac34654e1484ea8ef2b11bb5247ae5eda898c8
3
  size 119975656
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:04775532bd2e07bf11ebd2051856f8ff3cd14a3b1602476c8cd878dc55108be6
3
  size 119975656
optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e40cd6ba11d9a0ceaea16d7c58dce9d059685099ee9172ed66890d5851cdfc45
3
  size 60477396
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:945240ab0506a0e4e3b0b5cf5c427a1d717779a803ea92962e3be770f3863ecd
3
  size 60477396
rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e2411394ac968a82b73f6de27417329addc7551a6595e6f8e40c25c5f9f504b1
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6cc6d246693c4c7085670610c3cb24611d2a43f9c316a1c2833732f83270fcef
3
  size 14244
scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:767cf16b1af6a1442d6e9081070ae709d5786da93d28d3f0bf69c41bc72162ac
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05c0c42e10d78b34ca2f7aaf9f72ec3bcc915774ed80b66aaaec9d2cfc880dd7
3
  size 1064
trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.5625,
5
  "eval_steps": 2500,
6
- "global_step": 22500,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -233,6 +233,35 @@
233
  "eval_samples_per_second": 4.959,
234
  "eval_steps_per_second": 4.959,
235
  "step": 22500
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
236
  }
237
  ],
238
  "logging_steps": 1000,
@@ -240,7 +269,7 @@
240
  "num_input_tokens_seen": 0,
241
  "num_train_epochs": 1,
242
  "save_steps": 2500,
243
- "total_flos": 3.6229783486464e+17,
244
  "train_batch_size": 1,
245
  "trial_name": null,
246
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.625,
5
  "eval_steps": 2500,
6
+ "global_step": 25000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
233
  "eval_samples_per_second": 4.959,
234
  "eval_steps_per_second": 4.959,
235
  "step": 22500
236
+ },
237
+ {
238
+ "epoch": 0.57,
239
+ "grad_norm": 6.0290374755859375,
240
+ "learning_rate": 6.961739130434784e-06,
241
+ "loss": 1.3187,
242
+ "step": 23000
243
+ },
244
+ {
245
+ "epoch": 0.6,
246
+ "grad_norm": 2.862253189086914,
247
+ "learning_rate": 6.382028985507247e-06,
248
+ "loss": 1.321,
249
+ "step": 24000
250
+ },
251
+ {
252
+ "epoch": 0.62,
253
+ "grad_norm": 2.9182982444763184,
254
+ "learning_rate": 5.80231884057971e-06,
255
+ "loss": 1.3157,
256
+ "step": 25000
257
+ },
258
+ {
259
+ "epoch": 0.62,
260
+ "eval_loss": 1.2969852685928345,
261
+ "eval_runtime": 201.2648,
262
+ "eval_samples_per_second": 4.969,
263
+ "eval_steps_per_second": 4.969,
264
+ "step": 25000
265
  }
266
  ],
267
  "logging_steps": 1000,
 
269
  "num_input_tokens_seen": 0,
270
  "num_train_epochs": 1,
271
  "save_steps": 2500,
272
+ "total_flos": 4.025531498496e+17,
273
  "train_batch_size": 1,
274
  "trial_name": null,
275
  "trial_params": null