guyhadad01 commited on
Commit
fe33828
·
verified ·
1 Parent(s): fc5ed37

Training in progress, step 27200, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1201,6 +1201,10 @@ You can finetune this model on your own dataset.
1201
  | 0.4753 | 26900 | 0.5175 |
1202
  | 0.4762 | 26950 | 0.3398 |
1203
  | 0.4771 | 27000 | 0.3683 |
 
 
 
 
1204
 
1205
 
1206
  ### Framework Versions
 
1201
  | 0.4753 | 26900 | 0.5175 |
1202
  | 0.4762 | 26950 | 0.3398 |
1203
  | 0.4771 | 27000 | 0.3683 |
1204
+ | 0.4780 | 27050 | 0.341 |
1205
+ | 0.4789 | 27100 | 0.2753 |
1206
+ | 0.4798 | 27150 | 0.35 |
1207
+ | 0.4806 | 27200 | 0.3143 |
1208
 
1209
 
1210
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:157a36f69c8d6be89b19a5fc2041a6a70bae891ca7bdb6e1f8c5561949e9bafa
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:08045e1f2a8cd2432e9fa2b0ef00df2ac4ced1a000f41148266acaf751aa00fe
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3cf3f6a255c756d17edb6da60dbf398937995bd4e9513159583e5e4237f23a63
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:91e8be442cecb8de3b11e871dbe4b21251728bce4db99665346a4ae741dd9661
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:77b7843d303f1fcbcb7ded0ee18633ae1a240b93a82ce64b7dc80620210cefa4
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:527a9946e2b187cf3aeaac98a6c12f5dc108889d1a7d08a9def35306b103680a
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f721603f06800f16238813b709df823dd021b986d5f3f64a3fdb3ad2473f4313
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f6d84e0b16c16a3884265f119b778a7531d56abad22c7b0d844e8a1a93c8456c
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2b9c472a19e7b9448212aaddb68f6d9878d89c838a06487c2d680b2179532b97
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d1ac0dfa5e821d2ce353420d7dc3f3a06dc98c820a2502851855c1f7447269ad
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.47710766729692,
6
  "eval_steps": 500,
7
- "global_step": 27000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -3788,6 +3788,34 @@
3788
  "learning_rate": 2.905990457678035e-05,
3789
  "loss": 0.3683,
3790
  "step": 27000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3791
  }
3792
  ],
3793
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.48064179816578606,
6
  "eval_steps": 500,
7
+ "global_step": 27200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
3788
  "learning_rate": 2.905990457678035e-05,
3789
  "loss": 0.3683,
3790
  "step": 27000
3791
+ },
3792
+ {
3793
+ "epoch": 0.47799120001413653,
3794
+ "grad_norm": 1.1095103025436401,
3795
+ "learning_rate": 2.9010818558441815e-05,
3796
+ "loss": 0.341,
3797
+ "step": 27050
3798
+ },
3799
+ {
3800
+ "epoch": 0.47887473273135306,
3801
+ "grad_norm": 1.5168321132659912,
3802
+ "learning_rate": 2.8961732540103276e-05,
3803
+ "loss": 0.2753,
3804
+ "step": 27100
3805
+ },
3806
+ {
3807
+ "epoch": 0.4797582654485696,
3808
+ "grad_norm": 1.9980124235153198,
3809
+ "learning_rate": 2.891264652176474e-05,
3810
+ "loss": 0.35,
3811
+ "step": 27150
3812
+ },
3813
+ {
3814
+ "epoch": 0.48064179816578606,
3815
+ "grad_norm": 1.6252918243408203,
3816
+ "learning_rate": 2.8863560503426205e-05,
3817
+ "loss": 0.3143,
3818
+ "step": 27200
3819
  }
3820
  ],
3821
  "logging_steps": 50,