guyhadad01 committed on
Commit
6205692
·
verified ·
1 Parent(s): ae782ab

Training in progress, step 47200, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1233,6 +1233,10 @@ You can finetune this model on your own dataset.
1233
  | 0.8288 | 46900 | 0.2756 |
1234
  | 0.8296 | 46950 | 0.3345 |
1235
  | 0.8305 | 47000 | 0.3016 |
 
 
 
 
1236
 
1237
 
1238
  ### Framework Versions
 
1233
  | 0.8288 | 46900 | 0.2756 |
1234
  | 0.8296 | 46950 | 0.3345 |
1235
  | 0.8305 | 47000 | 0.3016 |
1236
+ | 0.8314 | 47050 | 0.2712 |
1237
+ | 0.8323 | 47100 | 0.3721 |
1238
+ | 0.8332 | 47150 | 0.3483 |
1239
+ | 0.8341 | 47200 | 0.3002 |
1240
 
1241
 
1242
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d215026fb98a4e80219f1300f712038cf2fa723f5168816bc64b2547a49bce2f
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cbf1ef32acc663cef4a7b10084a698b74270f6eb741911cc2c19a40d4c0c9fe9
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:10ceee43905dfe8e32b48bcbafa4954b114ed3adec82f09a2cc6c7e47d869d1b
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b8fd1c7342aa7b1f5feea1cd8fd2a3cbc1f9d6821e77a4dc9f2f20c41b62f35
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:370edc95f3ec87693c2f5c1d97900af678cc360f41a849a73def6dbfd862bd18
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cdfd2dd2386f51d8558af20986c5a837b3c2dfc1672baa40ef9d7dad6e51ec01
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5927361a532fb6c132d07b4ab7a520caf5f685a6698e2682d0ac3b35fea7ca5e
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:424edc0ec5b25fea421881d2bc754b25bc2bf24839236dba41579726e027f84d
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4d9635610518cbf3041eab5001840676a9398dea515bdb1588a50299a67cadbe
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b9442ef8854cff06718d69b0eacec882112fefdafab14f1f997662b135eaff9
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.8305207541835274,
6
  "eval_steps": 500,
7
- "global_step": 47000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -6588,6 +6588,34 @@
6588
  "learning_rate": 9.434332724666705e-06,
6589
  "loss": 0.3016,
6590
  "step": 47000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
6591
  }
6592
  ],
6593
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.8340548850523934,
6
  "eval_steps": 500,
7
+ "global_step": 47200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
6588
  "learning_rate": 9.434332724666705e-06,
6589
  "loss": 0.3016,
6590
  "step": 47000
6591
+ },
6592
+ {
6593
+ "epoch": 0.831404286900744,
6594
+ "grad_norm": 2.7783117294311523,
6595
+ "learning_rate": 9.38524670632817e-06,
6596
+ "loss": 0.2712,
6597
+ "step": 47050
6598
+ },
6599
+ {
6600
+ "epoch": 0.8322878196179605,
6601
+ "grad_norm": 4.626585483551025,
6602
+ "learning_rate": 9.336160687989634e-06,
6603
+ "loss": 0.3721,
6604
+ "step": 47100
6605
+ },
6606
+ {
6607
+ "epoch": 0.8331713523351769,
6608
+ "grad_norm": 1.097589135169983,
6609
+ "learning_rate": 9.287074669651097e-06,
6610
+ "loss": 0.3483,
6611
+ "step": 47150
6612
+ },
6613
+ {
6614
+ "epoch": 0.8340548850523934,
6615
+ "grad_norm": 1.6428859233856201,
6616
+ "learning_rate": 9.237988651312562e-06,
6617
+ "loss": 0.3002,
6618
+ "step": 47200
6619
  }
6620
  ],
6621
  "logging_steps": 50,