ZeroUniqueness committed on
Commit
392dc7b
·
1 Parent(s): 7963717

Training in progress, step 6600

Browse files
Files changed (25) hide show
  1. adapter_model.bin +1 -1
  2. {checkpoint-6200 → checkpoint-6500/adapter_model}/README.md +0 -0
  3. {checkpoint-6200 → checkpoint-6500/adapter_model}/adapter_config.json +0 -0
  4. {checkpoint-6200 → checkpoint-6500/adapter_model}/adapter_model.bin +1 -1
  5. {checkpoint-6200/adapter_model → checkpoint-6600}/README.md +0 -0
  6. {checkpoint-6200/adapter_model → checkpoint-6600}/adapter_config.json +0 -0
  7. {checkpoint-6200/adapter_model → checkpoint-6600}/adapter_model.bin +1 -1
  8. {checkpoint-6200 → checkpoint-6600}/optimizer.pt +1 -1
  9. {checkpoint-6200 → checkpoint-6600}/rng_state_0.pth +1 -1
  10. {checkpoint-6200 → checkpoint-6600}/rng_state_1.pth +1 -1
  11. {checkpoint-6200 → checkpoint-6600}/rng_state_10.pth +1 -1
  12. {checkpoint-6200 → checkpoint-6600}/rng_state_11.pth +1 -1
  13. {checkpoint-6200 → checkpoint-6600}/rng_state_12.pth +1 -1
  14. {checkpoint-6200 → checkpoint-6600}/rng_state_13.pth +1 -1
  15. {checkpoint-6200 → checkpoint-6600}/rng_state_2.pth +1 -1
  16. {checkpoint-6200 → checkpoint-6600}/rng_state_3.pth +1 -1
  17. {checkpoint-6200 → checkpoint-6600}/rng_state_4.pth +1 -1
  18. {checkpoint-6200 → checkpoint-6600}/rng_state_5.pth +1 -1
  19. {checkpoint-6200 → checkpoint-6600}/rng_state_6.pth +1 -1
  20. {checkpoint-6200 → checkpoint-6600}/rng_state_7.pth +1 -1
  21. {checkpoint-6200 → checkpoint-6600}/rng_state_8.pth +1 -1
  22. {checkpoint-6200 → checkpoint-6600}/rng_state_9.pth +1 -1
  23. {checkpoint-6200 → checkpoint-6600}/scheduler.pt +1 -1
  24. {checkpoint-6200 → checkpoint-6600}/trainer_state.json +99 -3
  25. {checkpoint-6200 → checkpoint-6600}/training_args.bin +0 -0
adapter_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:eca317a26dab233b92de0d6d401d39cb8b1fe17ca51e4a191e73b88cb76bfc3d
3
  size 500897101
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d81f9de68995df3ae7fe51e14a4d5a0482b3ff50173f115d320ee99247cb5e3d
3
  size 500897101
{checkpoint-6200 → checkpoint-6500/adapter_model}/README.md RENAMED
File without changes
{checkpoint-6200 → checkpoint-6500/adapter_model}/adapter_config.json RENAMED
File without changes
{checkpoint-6200 → checkpoint-6500/adapter_model}/adapter_model.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3febec860772b82c489867736d215315d0909ffc43a3ba7b9fbc1d0b41fd7a20
3
  size 500897101
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eca317a26dab233b92de0d6d401d39cb8b1fe17ca51e4a191e73b88cb76bfc3d
3
  size 500897101
{checkpoint-6200/adapter_model → checkpoint-6600}/README.md RENAMED
File without changes
{checkpoint-6200/adapter_model → checkpoint-6600}/adapter_config.json RENAMED
File without changes
{checkpoint-6200/adapter_model → checkpoint-6600}/adapter_model.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3febec860772b82c489867736d215315d0909ffc43a3ba7b9fbc1d0b41fd7a20
3
  size 500897101
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d81f9de68995df3ae7fe51e14a4d5a0482b3ff50173f115d320ee99247cb5e3d
3
  size 500897101
{checkpoint-6200 → checkpoint-6600}/optimizer.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c6c238a192e64d590edb62f130ceed462095ecf868445a5da756e160d8783d7e
3
  size 1001752701
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:126ec0322a5714bfa1d9503fe376d8ebf71cc64ffc913454c2c8b48b06bfd15f
3
  size 1001752701
{checkpoint-6200 → checkpoint-6600}/rng_state_0.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1a62682ba7e7cb26595ded7f48ec753d2eb9673721db81b0ec4152ba6856f2d2
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6a6a609c8ce73fc706f6fb966ebfd028a35b6fc2b3ef2c3b90b14c2d9d96c073
3
  size 27772
{checkpoint-6200 → checkpoint-6600}/rng_state_1.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:74be203c1e4634b2aa1037ec3a4a9edd5a7298915ce425cf1b9a31f6391efca1
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:513344a4102cc8801ca6a9111665c65ff7e9a337b61788efc4dbd10afd40421e
3
  size 27772
{checkpoint-6200 → checkpoint-6600}/rng_state_10.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c037a2c235445f0da915de6619ff6f7f42b2c0c8575b787c1a4ed16e35b61d21
3
  size 27789
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84bdaf5f54f27ae7dd4367ad1df5dc5c81c793f62be76df32dd2a92891c0ae9f
3
  size 27789
{checkpoint-6200 → checkpoint-6600}/rng_state_11.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b62b1f601e03a003f84cf80a8c292113d141ee87f5b1ca845fff2a924a30938e
3
  size 27789
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98e58aa58921c7b94e7c72eb60e9c4d6abe4187fa10dfd3dde14df9291075366
3
  size 27789
{checkpoint-6200 → checkpoint-6600}/rng_state_12.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6c758852b4f6179b67806b64c03556a85fc8cb6b2d7fc9b9802e599d92cb5060
3
  size 27789
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:90a0a154457600ec617c2bdbb216fa73b29edafbe85cd1f69bdc45d06510b354
3
  size 27789
{checkpoint-6200 → checkpoint-6600}/rng_state_13.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:212ebbd04054c53230c6f37560d76104b53022b0398cb77838fa4b24148235e3
3
  size 27789
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:702356496f60d3e621103bc084d4848106ba4006fdd2d5ad6640539693a5e42a
3
  size 27789
{checkpoint-6200 → checkpoint-6600}/rng_state_2.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0b20af4a6e33875e1906da2f4f958007730c9409557ca3cdfa5b4dc59f51e2d5
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:046a0af63804ca31a141d5015a52b23ee2774bb6e4992759b32c342ddc173129
3
  size 27772
{checkpoint-6200 → checkpoint-6600}/rng_state_3.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9f749729546f0e74d9ecf3ad24fea7d29dd1ae76d88741fcdcf02b50df73302c
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4eb3a5e7cd3e2477ec830ebb148f6b3b4ae734efaa4086c861d75bd02f98d32d
3
  size 27772
{checkpoint-6200 → checkpoint-6600}/rng_state_4.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0c21e5a49b0e24cc974d1d7d4406b9728cbea5332e18346ba9afb35e0372f526
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8dfd38532c9714d2d07dcbded515916fc4a2a8ebf7809eb89c8e40ba30623300
3
  size 27772
{checkpoint-6200 → checkpoint-6600}/rng_state_5.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3a33c776cc1ad3767cdac6f06b81c8d34fcc1d3ad73a9f8803254d0d817aa09a
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f6d24543c66c5d1f88ce0e125b12e7a3822599ea0fc5c8774770d4b6e36e9a0a
3
  size 27772
{checkpoint-6200 → checkpoint-6600}/rng_state_6.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:64fcf9ef649f08b421dd4acc8e2b02fc8f3ffefc82b05ef17dde8609c9d4bb40
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e194294db8d8734e6cc4d219d1f312dace676b799dac00f96ab1b32058105929
3
  size 27772
{checkpoint-6200 → checkpoint-6600}/rng_state_7.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cbea4f476c6f296b74387728b4c7179586b903ae8344e377cc5ce9725f14ba69
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1970a2d9f7cb4f5fff840955a3b522a1b4bb096917d81f71d05d1ab7512a2d1a
3
  size 27772
{checkpoint-6200 → checkpoint-6600}/rng_state_8.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ecac165f822fec78a8825820ff7d48e36aa3f53cb41f7a57d2e9dfadf8de351a
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4d396595cc95649a6e4b094f41829540f57ac9e24ad4e6eb37d58aac423d45a
3
  size 27772
{checkpoint-6200 → checkpoint-6600}/rng_state_9.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ba8091a98c98de998b6ead9067c77d9531ff0bb7b308e548615a3a1c2ec0f7e8
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aed28956ad5859c504e2fb1745186ccc74f16e74b31582a197cb9dcab20b3d56
3
  size 27772
{checkpoint-6200 → checkpoint-6600}/scheduler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1a2465347a031d34e4adae1fd19f3f075689a8b84714f2008d365cd61979bafe
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:152f426be01aff254cb20a567c7989c603706f46efd9a2a941b2d4911bff72ad
3
  size 627
{checkpoint-6200 → checkpoint-6600}/trainer_state.json RENAMED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 2.404032570763862,
5
- "global_step": 6200,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -1518,11 +1518,107 @@
1518
  "learning_rate": 1.8898031366808467e-05,
1519
  "loss": 0.7654,
1520
  "step": 6200
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1521
  }
1522
  ],
1523
  "max_steps": 7737,
1524
  "num_train_epochs": 3,
1525
- "total_flos": 2.6702654094117437e+19,
1526
  "trial_name": null,
1527
  "trial_params": null
1528
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 2.5591314462970143,
5
+ "global_step": 6600,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
1518
  "learning_rate": 1.8898031366808467e-05,
1519
  "loss": 0.7654,
1520
  "step": 6200
1521
+ },
1522
+ {
1523
+ "epoch": 2.41,
1524
+ "learning_rate": 1.830759827462004e-05,
1525
+ "loss": 0.7753,
1526
+ "step": 6225
1527
+ },
1528
+ {
1529
+ "epoch": 2.42,
1530
+ "learning_rate": 1.7725605054497906e-05,
1531
+ "loss": 0.7725,
1532
+ "step": 6250
1533
+ },
1534
+ {
1535
+ "epoch": 2.43,
1536
+ "learning_rate": 1.7152111833800522e-05,
1537
+ "loss": 0.7698,
1538
+ "step": 6275
1539
+ },
1540
+ {
1541
+ "epoch": 2.44,
1542
+ "learning_rate": 1.6587177861727454e-05,
1543
+ "loss": 0.7703,
1544
+ "step": 6300
1545
+ },
1546
+ {
1547
+ "epoch": 2.45,
1548
+ "learning_rate": 1.6030861503198204e-05,
1549
+ "loss": 0.7658,
1550
+ "step": 6325
1551
+ },
1552
+ {
1553
+ "epoch": 2.46,
1554
+ "learning_rate": 1.548322023282235e-05,
1555
+ "loss": 0.7677,
1556
+ "step": 6350
1557
+ },
1558
+ {
1559
+ "epoch": 2.47,
1560
+ "learning_rate": 1.4944310628961666e-05,
1561
+ "loss": 0.7694,
1562
+ "step": 6375
1563
+ },
1564
+ {
1565
+ "epoch": 2.48,
1566
+ "learning_rate": 1.4414188367884907e-05,
1567
+ "loss": 0.7668,
1568
+ "step": 6400
1569
+ },
1570
+ {
1571
+ "epoch": 2.49,
1572
+ "learning_rate": 1.3892908218015654e-05,
1573
+ "loss": 0.7662,
1574
+ "step": 6425
1575
+ },
1576
+ {
1577
+ "epoch": 2.5,
1578
+ "learning_rate": 1.3380524034274122e-05,
1579
+ "loss": 0.7689,
1580
+ "step": 6450
1581
+ },
1582
+ {
1583
+ "epoch": 2.51,
1584
+ "learning_rate": 1.2877088752513189e-05,
1585
+ "loss": 0.7694,
1586
+ "step": 6475
1587
+ },
1588
+ {
1589
+ "epoch": 2.52,
1590
+ "learning_rate": 1.2382654384049475e-05,
1591
+ "loss": 0.7714,
1592
+ "step": 6500
1593
+ },
1594
+ {
1595
+ "epoch": 2.53,
1596
+ "learning_rate": 1.1897272010289884e-05,
1597
+ "loss": 0.7701,
1598
+ "step": 6525
1599
+ },
1600
+ {
1601
+ "epoch": 2.54,
1602
+ "learning_rate": 1.1420991777454315e-05,
1603
+ "loss": 0.7628,
1604
+ "step": 6550
1605
+ },
1606
+ {
1607
+ "epoch": 2.55,
1608
+ "learning_rate": 1.0953862891394795e-05,
1609
+ "loss": 0.7661,
1610
+ "step": 6575
1611
+ },
1612
+ {
1613
+ "epoch": 2.56,
1614
+ "learning_rate": 1.0495933612511976e-05,
1615
+ "loss": 0.7729,
1616
+ "step": 6600
1617
  }
1618
  ],
1619
  "max_steps": 7737,
1620
  "num_train_epochs": 3,
1621
+ "total_flos": 2.842466784500515e+19,
1622
  "trial_name": null,
1623
  "trial_params": null
1624
  }
{checkpoint-6200 → checkpoint-6600}/training_args.bin RENAMED
File without changes