guyhadad01 commited on
Commit
bb9ae5f
·
verified ·
1 Parent(s): bf4359f

Training in progress, step 10400, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1229,6 +1229,10 @@ You can finetune this model on your own dataset.
1229
  | 0.1785 | 10100 | 0.4422 |
1230
  | 0.1794 | 10150 | 0.3747 |
1231
  | 0.1802 | 10200 | 0.3989 |
 
 
 
 
1232
 
1233
 
1234
  ### Framework Versions
 
1229
  | 0.1785 | 10100 | 0.4422 |
1230
  | 0.1794 | 10150 | 0.3747 |
1231
  | 0.1802 | 10200 | 0.3989 |
1232
+ | 0.1811 | 10250 | 0.5315 |
1233
+ | 0.1820 | 10300 | 0.3565 |
1234
+ | 0.1829 | 10350 | 0.4409 |
1235
+ | 0.1838 | 10400 | 0.3762 |
1236
 
1237
 
1238
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8b1113f1dc63b4ef74f5c024aa4257a74f5c601162a5392123b472bd440c772d
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e173a418a6557a53411f35be06de499d8fc58209e23cd022b66875c6fc5b0ae3
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:372cd21ba6640c7fb2d1ef5b71e6d5270fa8bff460e3c646226db5c68492b951
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:35f9ee877e3fc6c79f0984700034054c52886bebbe530aecf764a3bd0fec0227
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:11b6cb074bbe2129c4a92512f6b7604d9e93435cd6ffac4a406363aba2e66f67
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f7e3c346ce1d7e857e6a391133332aa5169f5fc12741629168a0c8fad4aa8ade
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8373615cf09b792af1b9fd441a341b87607a411c0918e8ae083ffab9de6dcc10
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8dcdfe9f3f1d3b35aba345a67f9e5702ec3b3998d6ddccfa8925c3c66df7986e
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:58c8231fde4f806f412947f64ac786f123198ace358add629069cb5de99c1e42
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ba07f8b635a7f5cbd77a454bf0384278026397ef33c00d176608de8376e15fc
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.18024067431216978,
6
  "eval_steps": 500,
7
- "global_step": 10200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -1436,6 +1436,34 @@
1436
  "learning_rate": 4.5543971255227666e-05,
1437
  "loss": 0.3989,
1438
  "step": 10200
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1439
  }
1440
  ],
1441
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.18377480518103587,
6
  "eval_steps": 500,
7
+ "global_step": 10400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
1436
  "learning_rate": 4.5543971255227666e-05,
1437
  "loss": 0.3989,
1438
  "step": 10200
1439
+ },
1440
+ {
1441
+ "epoch": 0.1811242070293863,
1442
+ "grad_norm": 1.464385747909546,
1443
+ "learning_rate": 4.549488523688913e-05,
1444
+ "loss": 0.5315,
1445
+ "step": 10250
1446
+ },
1447
+ {
1448
+ "epoch": 0.1820077397466028,
1449
+ "grad_norm": 1.2073971033096313,
1450
+ "learning_rate": 4.544579921855059e-05,
1451
+ "loss": 0.3565,
1452
+ "step": 10300
1453
+ },
1454
+ {
1455
+ "epoch": 0.18289127246381934,
1456
+ "grad_norm": 1.1773017644882202,
1457
+ "learning_rate": 4.5396713200212054e-05,
1458
+ "loss": 0.4409,
1459
+ "step": 10350
1460
+ },
1461
+ {
1462
+ "epoch": 0.18377480518103587,
1463
+ "grad_norm": 2.4389290809631348,
1464
+ "learning_rate": 4.534762718187352e-05,
1465
+ "loss": 0.3762,
1466
+ "step": 10400
1467
  }
1468
  ],
1469
  "logging_steps": 50,