polejowska committed on
Commit
c692c7e
1 Parent(s): 4a69ef1

End of training

Browse files
runs/Feb28_17-52-06_7c779bfb7013/events.out.tfevents.1677606732.7c779bfb7013.343.8 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2620daea2fcc95077507cc9936f97d36567df7d216e83d3e7c6f94ef4eb83fb1
3
- size 6672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7200fb45c44e48bf44b411cce26f438d34e84dd1de1ec0c47c02652fb2e4761
3
+ size 7026
trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 20.0,
5
- "global_step": 1880,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -288,18 +288,88 @@
288
  "step": 1880
289
  },
290
  {
291
- "epoch": 20.0,
292
- "step": 1880,
293
- "total_flos": 7.1683864704e+18,
294
- "train_loss": 0.5789503787426238,
295
- "train_runtime": 1191.4496,
296
- "train_samples_per_second": 12.59,
297
- "train_steps_per_second": 1.578
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
298
  }
299
  ],
300
- "max_steps": 1880,
301
- "num_train_epochs": 20,
302
- "total_flos": 7.1683864704e+18,
303
  "trial_name": null,
304
  "trial_params": null
305
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 25.0,
5
+ "global_step": 2350,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
288
  "step": 1880
289
  },
290
  {
291
+ "epoch": 21.0,
292
+ "learning_rate": 1.6000000000000003e-05,
293
+ "loss": 2.2906,
294
+ "step": 1974
295
+ },
296
+ {
297
+ "epoch": 21.0,
298
+ "eval_loss": 1.734320878982544,
299
+ "eval_runtime": 34.5789,
300
+ "eval_samples_per_second": 5.784,
301
+ "eval_steps_per_second": 0.723,
302
+ "step": 1974
303
+ },
304
+ {
305
+ "epoch": 22.0,
306
+ "learning_rate": 1.2e-05,
307
+ "loss": 2.2492,
308
+ "step": 2068
309
+ },
310
+ {
311
+ "epoch": 22.0,
312
+ "eval_loss": 1.7080261707305908,
313
+ "eval_runtime": 35.1218,
314
+ "eval_samples_per_second": 5.694,
315
+ "eval_steps_per_second": 0.712,
316
+ "step": 2068
317
+ },
318
+ {
319
+ "epoch": 23.0,
320
+ "learning_rate": 8.000000000000001e-06,
321
+ "loss": 2.2516,
322
+ "step": 2162
323
+ },
324
+ {
325
+ "epoch": 23.0,
326
+ "eval_loss": 1.718016505241394,
327
+ "eval_runtime": 34.8144,
328
+ "eval_samples_per_second": 5.745,
329
+ "eval_steps_per_second": 0.718,
330
+ "step": 2162
331
+ },
332
+ {
333
+ "epoch": 24.0,
334
+ "learning_rate": 4.000000000000001e-06,
335
+ "loss": 2.2574,
336
+ "step": 2256
337
+ },
338
+ {
339
+ "epoch": 24.0,
340
+ "eval_loss": 1.7081444263458252,
341
+ "eval_runtime": 34.6174,
342
+ "eval_samples_per_second": 5.777,
343
+ "eval_steps_per_second": 0.722,
344
+ "step": 2256
345
+ },
346
+ {
347
+ "epoch": 25.0,
348
+ "learning_rate": 0.0,
349
+ "loss": 2.2508,
350
+ "step": 2350
351
+ },
352
+ {
353
+ "epoch": 25.0,
354
+ "eval_loss": 1.7065184116363525,
355
+ "eval_runtime": 34.9055,
356
+ "eval_samples_per_second": 5.73,
357
+ "eval_steps_per_second": 0.716,
358
+ "step": 2350
359
+ },
360
+ {
361
+ "epoch": 25.0,
362
+ "step": 2350,
363
+ "total_flos": 8.960483088e+18,
364
+ "train_loss": 0.45198433734001,
365
+ "train_runtime": 1195.2772,
366
+ "train_samples_per_second": 15.687,
367
+ "train_steps_per_second": 1.966
368
  }
369
  ],
370
+ "max_steps": 2350,
371
+ "num_train_epochs": 25,
372
+ "total_flos": 8.960483088e+18,
373
  "trial_name": null,
374
  "trial_params": null
375
  }