guyhadad01 committed on
Commit
180004e
·
verified ·
1 Parent(s): 3f73c1b

Training in progress, step 43000, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1375,6 +1375,10 @@ You can finetune this model on your own dataset.
1375
  | 0.7545 | 42700 | 0.3352 |
1376
  | 0.7554 | 42750 | 0.3143 |
1377
  | 0.7563 | 42800 | 0.2833 |
 
 
 
 
1378
 
1379
  </details>
1380
 
 
1375
  | 0.7545 | 42700 | 0.3352 |
1376
  | 0.7554 | 42750 | 0.3143 |
1377
  | 0.7563 | 42800 | 0.2833 |
1378
+ | 0.7572 | 42850 | 0.2851 |
1379
+ | 0.7581 | 42900 | 0.2956 |
1380
+ | 0.7590 | 42950 | 0.3038 |
1381
+ | 0.7598 | 43000 | 0.2195 |
1382
 
1383
  </details>
1384
 
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:947ad26bf0a1ea98a40d7847b1d4081968d0ea03f777dd415d118a3341c7d595
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:75caeec9f53b9b891200013c0a2fd18951ed97d80436096583e4cb1480de71e5
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fbe6b037eef5d6174a1e64a06f40631b730395d9ff0774dfc1245b870b5a756f
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b1f4e8d78cc6baa416d9c6a87aa0b3025829063989d02f0b2a8b88b559ded826
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0a0a70fc822cbf0577f57f474f054d71e07e1660e7791d186284f5053153721d
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4be9a690b209a02eb17ce8e3f85da6cd14d4dc8a1275cbf619841edc0fbfa444
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:31395f18239b3bc788fb9174ae1acda597a1a3b63f5595848ade3391438691e5
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6cac2489bb213d35fe01f779a670cf1cba6053f86765e6ddff3ab2ce908e2308
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ff01474c5f0e5dbd5aec03f387f08f61e0a9ae8d77c69168920103f17f16f317
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:beb8449b565ba883e76cbff731d0f062ded7c2721b6cab570d00dd75a772df6d
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.7563040059373398,
6
  "eval_steps": 500,
7
- "global_step": 42800,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -6000,6 +6000,34 @@
6000
  "learning_rate": 1.3555594824370226e-05,
6001
  "loss": 0.2833,
6002
  "step": 42800
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
6003
  }
6004
  ],
6005
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.7598381368062059,
6
  "eval_steps": 500,
7
+ "global_step": 43000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
6000
  "learning_rate": 1.3555594824370226e-05,
6001
  "loss": 0.2833,
6002
  "step": 42800
6003
+ },
6004
+ {
6005
+ "epoch": 0.7571875386545563,
6006
+ "grad_norm": 1.5535756349563599,
6007
+ "learning_rate": 1.350650880603169e-05,
6008
+ "loss": 0.2851,
6009
+ "step": 42850
6010
+ },
6011
+ {
6012
+ "epoch": 0.7580710713717729,
6013
+ "grad_norm": 1.3919951915740967,
6014
+ "learning_rate": 1.3457422787693156e-05,
6015
+ "loss": 0.2956,
6016
+ "step": 42900
6017
+ },
6018
+ {
6019
+ "epoch": 0.7589546040889894,
6020
+ "grad_norm": 1.531242847442627,
6021
+ "learning_rate": 1.3408336769354619e-05,
6022
+ "loss": 0.3038,
6023
+ "step": 42950
6024
+ },
6025
+ {
6026
+ "epoch": 0.7598381368062059,
6027
+ "grad_norm": 1.4396170377731323,
6028
+ "learning_rate": 1.335925075101608e-05,
6029
+ "loss": 0.2195,
6030
+ "step": 43000
6031
  }
6032
  ],
6033
  "logging_steps": 50,