ncbateman commited on
Commit
24c0b40
·
verified ·
1 Parent(s): 313c644

Training in progress, step 770, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:560166bd58797be34a5a1006e32be8d9d7bdd6e8139374eec22dd6b030c09335
3
  size 97307544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a27ac3e1ec7d35dbea0ec3b749056abc8d7add31611980aa12634912c331b3e
3
  size 97307544
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7bcb1129b7246e53076259c323b591293fbe3c9a50fd35601ccc934945096be6
3
  size 49846644
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dc2554f05f98e629fa96b10b8d45a8fd3ca22fb76f1ef5482b6601045564c6b8
3
  size 49846644
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fc3fad3909fb536f4d0d7737147157c83d6378be43badc6330cb993db1a38d1e
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:03dbd3ca99b04175952be4801caaa60aa6bc88d41389058fe0bc17432ac48c89
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:117b21438fb9f77af4ac0954437849c611bcc84854c07120ecb52f05f7373ae0
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2014e732464a9f8815060f53131de6c0ff6b56b6305dcffb1856efbb56d78b5c
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.9899708832093174,
5
  "eval_steps": 386,
6
- "global_step": 765,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -5378,6 +5378,41 @@
5378
  "learning_rate": 9.155915935223121e-05,
5379
  "loss": 0.8196,
5380
  "step": 765
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5381
  }
5382
  ],
5383
  "logging_steps": 1,
@@ -5397,7 +5432,7 @@
5397
  "attributes": {}
5398
  }
5399
  },
5400
- "total_flos": 8.552219363455795e+17,
5401
  "train_batch_size": 4,
5402
  "trial_name": null,
5403
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.99644128113879,
5
  "eval_steps": 386,
6
+ "global_step": 770,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
5378
  "learning_rate": 9.155915935223121e-05,
5379
  "loss": 0.8196,
5380
  "step": 765
5381
+ },
5382
+ {
5383
+ "epoch": 0.9912649627952119,
5384
+ "grad_norm": 0.6537997722625732,
5385
+ "learning_rate": 9.153622237487127e-05,
5386
+ "loss": 0.6911,
5387
+ "step": 766
5388
+ },
5389
+ {
5390
+ "epoch": 0.9925590423811065,
5391
+ "grad_norm": 0.6952023506164551,
5392
+ "learning_rate": 9.15132571567263e-05,
5393
+ "loss": 0.7354,
5394
+ "step": 767
5395
+ },
5396
+ {
5397
+ "epoch": 0.9938531219670009,
5398
+ "grad_norm": 0.7851712703704834,
5399
+ "learning_rate": 9.149026371341049e-05,
5400
+ "loss": 1.0092,
5401
+ "step": 768
5402
+ },
5403
+ {
5404
+ "epoch": 0.9951472015528955,
5405
+ "grad_norm": 0.8476317524909973,
5406
+ "learning_rate": 9.146724206055725e-05,
5407
+ "loss": 1.0262,
5408
+ "step": 769
5409
+ },
5410
+ {
5411
+ "epoch": 0.99644128113879,
5412
+ "grad_norm": 0.7637205123901367,
5413
+ "learning_rate": 9.144419221381919e-05,
5414
+ "loss": 0.879,
5415
+ "step": 770
5416
  }
5417
  ],
5418
  "logging_steps": 1,
 
5432
  "attributes": {}
5433
  }
5434
  },
5435
+ "total_flos": 8.608116222040474e+17,
5436
  "train_batch_size": 4,
5437
  "trial_name": null,
5438
  "trial_params": null