guyhadad01 commited on
Commit
22df50d
·
verified ·
1 Parent(s): 9b8d6b9

Training in progress, step 11200, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1245,6 +1245,10 @@ You can finetune this model on your own dataset.
1245
  | 0.1926 | 10900 | 0.4082 |
1246
  | 0.1935 | 10950 | 0.4056 |
1247
  | 0.1944 | 11000 | 0.4435 |
 
 
 
 
1248
 
1249
 
1250
  ### Framework Versions
 
1245
  | 0.1926 | 10900 | 0.4082 |
1246
  | 0.1935 | 10950 | 0.4056 |
1247
  | 0.1944 | 11000 | 0.4435 |
1248
+ | 0.1953 | 11050 | 0.4272 |
1249
+ | 0.1961 | 11100 | 0.4334 |
1250
+ | 0.1970 | 11150 | 0.4479 |
1251
+ | 0.1979 | 11200 | 0.3545 |
1252
 
1253
 
1254
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:68fa837444bb1d1983506586971bf36bcb05644b535c7a58278e0f70de2e98b7
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6e44300f1a7eda978b714254f7642e5fa8e46c4465149d151fb36c7a22d09887
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:22e30cc5ca132903fd2a4ed91cad71091631f1cc2f4eba3197af287eeafbaf42
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:283034d540cc735bf4188ad3d17ee98d86aa7e8c24e656d2a4ff17d9e61dfb8e
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e22fe178097ffc288163bb2b208108bb4bcac4332048a6b0583e8f00c3efbf3d
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f802fc7d6b08b3448bdbc5653ab5c831b50c834ee5d8105b5d34c4dfeaebf61e
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:43a0047c1f4849b7b6cea19c700df8596a7bc71c9ef39f6ce4cc6960374828c2
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16f0df52c717c2e3e1dfb7c95b1b78d2bff8956a86b6980e2bde6913f11a1016
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cd72024597b2c3bf8343bfe8c1006caf70bcb94b9f5552f878b8f2c8272ff940
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5330400d6885c6b9af0b1821a1e49b220dac708c65a515f28b9197806d03f3ed
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.19437719778763407,
6
  "eval_steps": 500,
7
- "global_step": 11000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -1548,6 +1548,34 @@
1548
  "learning_rate": 4.475957668217785e-05,
1549
  "loss": 0.4435,
1550
  "step": 11000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1551
  }
1552
  ],
1553
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.19791132865650016,
6
  "eval_steps": 500,
7
+ "global_step": 11200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
1548
  "learning_rate": 4.475957668217785e-05,
1549
  "loss": 0.4435,
1550
  "step": 11000
1551
+ },
1552
+ {
1553
+ "epoch": 0.1952607305048506,
1554
+ "grad_norm": 2.1512463092803955,
1555
+ "learning_rate": 4.4710490663839315e-05,
1556
+ "loss": 0.4272,
1557
+ "step": 11050
1558
+ },
1559
+ {
1560
+ "epoch": 0.1961442632220671,
1561
+ "grad_norm": 1.5526123046875,
1562
+ "learning_rate": 4.466140464550077e-05,
1563
+ "loss": 0.4334,
1564
+ "step": 11100
1565
+ },
1566
+ {
1567
+ "epoch": 0.19702779593928363,
1568
+ "grad_norm": 1.4258567094802856,
1569
+ "learning_rate": 4.4612318627162245e-05,
1570
+ "loss": 0.4479,
1571
+ "step": 11150
1572
+ },
1573
+ {
1574
+ "epoch": 0.19791132865650016,
1575
+ "grad_norm": 3.2408463954925537,
1576
+ "learning_rate": 4.456323260882371e-05,
1577
+ "loss": 0.3545,
1578
+ "step": 11200
1579
  }
1580
  ],
1581
  "logging_steps": 50,