TachyHealthResearch committed on
Commit
d82f6b3
1 Parent(s): c44c6e4

Training in progress, step 70, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e219836db331fb2c22e167af2c158d700560aae27dc6a75c160dae363c629cd1
3
  size 83945296
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0a3a9ed1385ba2a9486987fb064d61e322c4b33a584269d83c319b3e60a9b07
3
  size 83945296
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d088274e6e4b583afe59f323ed350eaf66dca870661c394c8ede6293508ee82e
3
  size 42545748
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:33e7221101e4a7fade7ddd4b88da7c505da46d19376708b1c05f8d12428b2803
3
  size 42545748
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:babf9cef0f970e1cd241f9533a5b0bc052a39fc9df617e7f31209a9691bd42d1
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:557e474a226d303e26d6758a2eb18bb0bbe3b1a451146f9953c40e79b727f273
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:87f5541cd8b8cc2355cb28b7b43b87c2e735f1841d8477f8ed4c15392845734c
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1723a4b1c943236de3935bcf77e35b80aec5d8ffd41a734f2052202a2aabea88
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.024,
5
  "eval_steps": 1000,
6
- "global_step": 60,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -367,13 +367,73 @@
367
  "learning_rate": 8.421052631578948e-05,
368
  "loss": 1.5684,
369
  "step": 60
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
370
  }
371
  ],
372
  "logging_steps": 1,
373
  "max_steps": 100,
374
  "num_train_epochs": 1,
375
  "save_steps": 10,
376
- "total_flos": 3532725037301760.0,
377
  "trial_name": null,
378
  "trial_params": null
379
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.028,
5
  "eval_steps": 1000,
6
+ "global_step": 70,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
367
  "learning_rate": 8.421052631578948e-05,
368
  "loss": 1.5684,
369
  "step": 60
370
+ },
371
+ {
372
+ "epoch": 0.02,
373
+ "learning_rate": 8.210526315789474e-05,
374
+ "loss": 1.6735,
375
+ "step": 61
376
+ },
377
+ {
378
+ "epoch": 0.02,
379
+ "learning_rate": 8e-05,
380
+ "loss": 1.5827,
381
+ "step": 62
382
+ },
383
+ {
384
+ "epoch": 0.03,
385
+ "learning_rate": 7.789473684210526e-05,
386
+ "loss": 1.5755,
387
+ "step": 63
388
+ },
389
+ {
390
+ "epoch": 0.03,
391
+ "learning_rate": 7.578947368421054e-05,
392
+ "loss": 1.3339,
393
+ "step": 64
394
+ },
395
+ {
396
+ "epoch": 0.03,
397
+ "learning_rate": 7.368421052631579e-05,
398
+ "loss": 1.4373,
399
+ "step": 65
400
+ },
401
+ {
402
+ "epoch": 0.03,
403
+ "learning_rate": 7.157894736842105e-05,
404
+ "loss": 1.9484,
405
+ "step": 66
406
+ },
407
+ {
408
+ "epoch": 0.03,
409
+ "learning_rate": 6.947368421052632e-05,
410
+ "loss": 1.5517,
411
+ "step": 67
412
+ },
413
+ {
414
+ "epoch": 0.03,
415
+ "learning_rate": 6.736842105263159e-05,
416
+ "loss": 1.5427,
417
+ "step": 68
418
+ },
419
+ {
420
+ "epoch": 0.03,
421
+ "learning_rate": 6.526315789473685e-05,
422
+ "loss": 1.689,
423
+ "step": 69
424
+ },
425
+ {
426
+ "epoch": 0.03,
427
+ "learning_rate": 6.31578947368421e-05,
428
+ "loss": 1.5722,
429
+ "step": 70
430
  }
431
  ],
432
  "logging_steps": 1,
433
  "max_steps": 100,
434
  "num_train_epochs": 1,
435
  "save_steps": 10,
436
+ "total_flos": 4233108315045888.0,
437
  "trial_name": null,
438
  "trial_params": null
439
  }