guyhadad01 committed on
Commit
5b8016b
·
verified ·
1 Parent(s): 987b620

Training in progress, step 36000, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1233,6 +1233,10 @@ You can finetune this model on your own dataset.
1233
  | 0.6308 | 35700 | 0.312 |
1234
  | 0.6317 | 35750 | 0.2776 |
1235
  | 0.6326 | 35800 | 0.2574 |
 
 
 
 
1236
 
1237
 
1238
  ### Framework Versions
 
1233
  | 0.6308 | 35700 | 0.312 |
1234
  | 0.6317 | 35750 | 0.2776 |
1235
  | 0.6326 | 35800 | 0.2574 |
1236
+ | 0.6335 | 35850 | 0.2816 |
1237
+ | 0.6344 | 35900 | 0.3392 |
1238
+ | 0.6353 | 35950 | 0.2856 |
1239
+ | 0.6361 | 36000 | 0.286 |
1240
 
1241
 
1242
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bae377c97d95c091e602ea66921e5e1054c92655fcc87b72a9e144d35f4777b9
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14b384b5f887acee5a6096737f368c3613e7537b072283344d0460f9ee33683f
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:53dd7b57f3f8c10ab9b2a35f0933e4ed0758fa2fa30468c3dcc9a374cbfea064
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:94f7c656111e857b9a5964461ddb67ba8434de7b657a0de6cf811249e9f135c7
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:21564110007d55db6f6a52d1c9590217ce427ced36eba0a8dc124d9288a67d6c
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:83863be742a336d65a58bf9026fc223fa44e5cc37215b2331b9a723f209bc947
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2ecaf6e4f08856d634b99dd1969eedbd96a7e22708903309e7e68fda2bacc394
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a1b02513987752f55c2a09cb46fb561fd6490aaf9c1a9fb121a08671c8653dcd
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c7083008eae1faaed45dcde0eba354b7d59a06375dff301d884f49f745cc4e30
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e587de7316b1032258fa34321e4e4cbe60d0a5d83b11f22c68cdcdf7469e3a42
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.6326094255270273,
6
  "eval_steps": 500,
7
- "global_step": 35800,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -5020,6 +5020,34 @@
5020
  "learning_rate": 2.0423710510298248e-05,
5021
  "loss": 0.2574,
5022
  "step": 35800
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5023
  }
5024
  ],
5025
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.6361435563958934,
6
  "eval_steps": 500,
7
+ "global_step": 36000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
5020
  "learning_rate": 2.0423710510298248e-05,
5021
  "loss": 0.2574,
5022
  "step": 35800
5023
+ },
5024
+ {
5025
+ "epoch": 0.6334929582442438,
5026
+ "grad_norm": 1.6969387531280518,
5027
+ "learning_rate": 2.0374624491959713e-05,
5028
+ "loss": 0.2816,
5029
+ "step": 35850
5030
+ },
5031
+ {
5032
+ "epoch": 0.6343764909614603,
5033
+ "grad_norm": 2.4319510459899902,
5034
+ "learning_rate": 2.0325538473621174e-05,
5035
+ "loss": 0.3392,
5036
+ "step": 35900
5037
+ },
5038
+ {
5039
+ "epoch": 0.6352600236786768,
5040
+ "grad_norm": 1.4081567525863647,
5041
+ "learning_rate": 2.027645245528264e-05,
5042
+ "loss": 0.2856,
5043
+ "step": 35950
5044
+ },
5045
+ {
5046
+ "epoch": 0.6361435563958934,
5047
+ "grad_norm": 1.2967078685760498,
5048
+ "learning_rate": 2.02273664369441e-05,
5049
+ "loss": 0.286,
5050
+ "step": 36000
5051
  }
5052
  ],
5053
  "logging_steps": 50,