guyhadad01 committed on
Commit
60d4c48
·
verified ·
1 Parent(s): 061100c

Training in progress, step 26800, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1193,6 +1193,10 @@ You can finetune this model on your own dataset.
1193
  | 0.4683 | 26500 | 0.3204 |
1194
  | 0.4692 | 26550 | 0.2698 |
1195
  | 0.4700 | 26600 | 0.3019 |
 
 
 
 
1196
 
1197
 
1198
  ### Framework Versions
 
1193
  | 0.4683 | 26500 | 0.3204 |
1194
  | 0.4692 | 26550 | 0.2698 |
1195
  | 0.4700 | 26600 | 0.3019 |
1196
+ | 0.4709 | 26650 | 0.276 |
1197
+ | 0.4718 | 26700 | 0.2572 |
1198
+ | 0.4727 | 26750 | 0.2821 |
1199
+ | 0.4736 | 26800 | 0.2753 |
1200
 
1201
 
1202
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:efcfe5aa0c5005b2003bf869f963a20c876745fa7f627f40c3819a73de45b137
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6af9e8fc53f229d8df337a8754e2d3d5b113d4716605b013bad83e9e09dacdb0
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e583966410e9fff5f8ac46b24676c49f860c538a27398df242344bd0d2a7d08c
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:de6d4daedba612d713f9144d945bcc7668fddc99a7c572a8a7ecdaadfce55d9f
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0bea9f5fcadeb0cd0d9a943463b72fc5766ebc9e57169008c5a18a91f57902fe
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd90d4d272f52093bcd166fb2fee1129e8da49cd6cade68a0c1872a9ab44bae6
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fc231b83c50d1c7b06b068e6375671742fac1a054d31705297b772d1dffbf9a2
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9102615210716abefe38c971af7617c4ceba795e3412ef59968e79b6fe53891e
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:93fabb93104e1056a717edb04db9d7d8955bbdc038b375db1506268b873e6fee
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ca320c82587b083501742caf7cc80ec1a98ca247bf4b8c7cd91053ff97a2d44
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.4700394055591879,
6
  "eval_steps": 500,
7
- "global_step": 26600,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -3732,6 +3732,34 @@
3732
  "learning_rate": 2.9452592723488643e-05,
3733
  "loss": 0.3019,
3734
  "step": 26600
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3735
  }
3736
  ],
3737
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.47357353642805394,
6
  "eval_steps": 500,
7
+ "global_step": 26800,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
3732
  "learning_rate": 2.9452592723488643e-05,
3733
  "loss": 0.3019,
3734
  "step": 26600
3735
+ },
3736
+ {
3737
+ "epoch": 0.47092293827640436,
3738
+ "grad_norm": 1.6362017393112183,
3739
+ "learning_rate": 2.9403506705150108e-05,
3740
+ "loss": 0.276,
3741
+ "step": 26650
3742
+ },
3743
+ {
3744
+ "epoch": 0.4718064709936209,
3745
+ "grad_norm": 1.5143210887908936,
3746
+ "learning_rate": 2.935442068681157e-05,
3747
+ "loss": 0.2572,
3748
+ "step": 26700
3749
+ },
3750
+ {
3751
+ "epoch": 0.4726900037108374,
3752
+ "grad_norm": 2.1000730991363525,
3753
+ "learning_rate": 2.9305334668473034e-05,
3754
+ "loss": 0.2821,
3755
+ "step": 26750
3756
+ },
3757
+ {
3758
+ "epoch": 0.47357353642805394,
3759
+ "grad_norm": 1.9400396347045898,
3760
+ "learning_rate": 2.9256248650134498e-05,
3761
+ "loss": 0.2753,
3762
+ "step": 26800
3763
  }
3764
  ],
3765
  "logging_steps": 50,