guyhadad01 committed on
Commit
2a44d0f
·
verified ·
1 Parent(s): 00d5b3a

Training in progress, step 20200, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1427,6 +1427,10 @@ You can finetune this model on your own dataset.
1427
  | 0.3516 | 19900 | 0.3636 |
1428
  | 0.3525 | 19950 | 0.3704 |
1429
  | 0.3534 | 20000 | 0.3459 |
 
 
 
 
1430
 
1431
  </details>
1432
 
 
1427
  | 0.3516 | 19900 | 0.3636 |
1428
  | 0.3525 | 19950 | 0.3704 |
1429
  | 0.3534 | 20000 | 0.3459 |
1430
+ | 0.3543 | 20050 | 0.3226 |
1431
+ | 0.3552 | 20100 | 0.3256 |
1432
+ | 0.3561 | 20150 | 0.3179 |
1433
+ | 0.3569 | 20200 | 0.4226 |
1434
 
1435
  </details>
1436
 
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e7072d59f5aacf209413bfe1b68393d31e61f586cffca0291db2c96c4018ed70
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0ef29b19104cdd2fee93b8217bc742ea19781fda755240150a391d0a52137790
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7ace23ee1b367e732fb2aa3f1a05392e0e438a9535dad79c057fb1b8e02b9d68
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b84ead54747767096d47dd620e6c1d4484392809c929ebd262e713e54fdf126a
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:14dd25fc849fe74831fabbde14139b26a0f4aad6b8e087440c778d9e11ab8d7e
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67d7c2b4ab7e82df68b4a7c174bebe88de85db56b4421a6d44a9a14dfc374b05
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:313073d5ed3020eae2b8815f959d08ffdd33605f3a4a238421bfb13a6954c251
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:75cb2a5d4e61624cc82e548180286aa5f7b7073a2bd43f3a7494227c84590e41
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cde16ded14375bc47c997c2d556dc8340b61e53a3892d07fbf99a72d763ffa8d
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a28e3c14c246edc1f658e8b3ed3e4804f86c97afddb1e9e8b6cfd065ec104723
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.3534130868866074,
6
  "eval_steps": 500,
7
- "global_step": 20000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -2808,6 +2808,34 @@
2808
  "learning_rate": 3.5928020262708373e-05,
2809
  "loss": 0.3459,
2810
  "step": 20000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2811
  }
2812
  ],
2813
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.3569472177554735,
6
  "eval_steps": 500,
7
+ "global_step": 20200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
2808
  "learning_rate": 3.5928020262708373e-05,
2809
  "loss": 0.3459,
2810
  "step": 20000
2811
+ },
2812
+ {
2813
+ "epoch": 0.3542966196038239,
2814
+ "grad_norm": 2.97851824760437,
2815
+ "learning_rate": 3.587893424436983e-05,
2816
+ "loss": 0.3226,
2817
+ "step": 20050
2818
+ },
2819
+ {
2820
+ "epoch": 0.35518015232104044,
2821
+ "grad_norm": 2.1979775428771973,
2822
+ "learning_rate": 3.5829848226031296e-05,
2823
+ "loss": 0.3256,
2824
+ "step": 20100
2825
+ },
2826
+ {
2827
+ "epoch": 0.35606368503825697,
2828
+ "grad_norm": 1.762453556060791,
2829
+ "learning_rate": 3.578076220769276e-05,
2830
+ "loss": 0.3179,
2831
+ "step": 20150
2832
+ },
2833
+ {
2834
+ "epoch": 0.3569472177554735,
2835
+ "grad_norm": 1.4908533096313477,
2836
+ "learning_rate": 3.5731676189354225e-05,
2837
+ "loss": 0.4226,
2838
+ "step": 20200
2839
  }
2840
  ],
2841
  "logging_steps": 50,