guyhadad01 commited on
Commit
ebff636
·
verified ·
1 Parent(s): 19b1d00

Training in progress, step 28600, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1229,6 +1229,10 @@ You can finetune this model on your own dataset.
1229
  | 0.5001 | 28300 | 0.3338 |
1230
  | 0.5010 | 28350 | 0.3109 |
1231
  | 0.5018 | 28400 | 0.3234 |
 
 
 
 
1232
 
1233
 
1234
  ### Framework Versions
 
1229
  | 0.5001 | 28300 | 0.3338 |
1230
  | 0.5010 | 28350 | 0.3109 |
1231
  | 0.5018 | 28400 | 0.3234 |
1232
+ | 0.5027 | 28450 | 0.3257 |
1233
+ | 0.5036 | 28500 | 0.4675 |
1234
+ | 0.5045 | 28550 | 0.4318 |
1235
+ | 0.5054 | 28600 | 0.3594 |
1236
 
1237
 
1238
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:63181bf09a1c611c492c8b6ad279006fb56b9805969d0edba71cff3ee723a234
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1974b8b79f821393033413b708b3d76af02ee0630fc769c360d30160ba1e49c
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d1746c035958eb9e0a972414e56f8fa4733c0402b003adb0be00e93e8ce71e93
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:80de25a64d3a7f9b01d3ac384a24ef9565f911507016f6cb2ebb2675cd2fca9a
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:febec73de51eb7db9177092196a53a5124fb83edff44db6d3e9496c1ee972476
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:104316cbc87d14059ece260dae5c5774e3d91c358c1eb53b1e4cc6f9aa5826ec
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f5147f98e53184b8dd37c8115204cda76018272755476678192eccb1efdd5d07
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ed0a067ae758f61df93eb0349389528a459caaf90517ed5419a4c3a8ab14656
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:953c76ee5b14f1426684c90829d80bb305b640c5a3e12732ffb64cce4b8f5126
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7c41c0a76cd352649e53d0354e3152b28ade5f9653e46110b22a1db6134af332
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.5018465833789825,
6
  "eval_steps": 500,
7
- "global_step": 28400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -3984,6 +3984,34 @@
3984
  "learning_rate": 2.768549606330133e-05,
3985
  "loss": 0.3234,
3986
  "step": 28400
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3987
  }
3988
  ],
3989
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.5053807142478486,
6
  "eval_steps": 500,
7
+ "global_step": 28600,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
3984
  "learning_rate": 2.768549606330133e-05,
3985
  "loss": 0.3234,
3986
  "step": 28400
3987
+ },
3988
+ {
3989
+ "epoch": 0.502730116096199,
3990
+ "grad_norm": 1.497454285621643,
3991
+ "learning_rate": 2.7636410044962795e-05,
3992
+ "loss": 0.3257,
3993
+ "step": 28450
3994
+ },
3995
+ {
3996
+ "epoch": 0.5036136488134155,
3997
+ "grad_norm": 3.3886194229125977,
3998
+ "learning_rate": 2.7587324026624256e-05,
3999
+ "loss": 0.4675,
4000
+ "step": 28500
4001
+ },
4002
+ {
4003
+ "epoch": 0.504497181530632,
4004
+ "grad_norm": 1.6604270935058594,
4005
+ "learning_rate": 2.753823800828572e-05,
4006
+ "loss": 0.4318,
4007
+ "step": 28550
4008
+ },
4009
+ {
4010
+ "epoch": 0.5053807142478486,
4011
+ "grad_norm": 1.7005223035812378,
4012
+ "learning_rate": 2.7489151989947186e-05,
4013
+ "loss": 0.3594,
4014
+ "step": 28600
4015
  }
4016
  ],
4017
  "logging_steps": 50,