Commit
Β·
392dc7b
1
Parent(s):
7963717
Training in progress, step 6600
Browse files- adapter_model.bin +1 -1
- {checkpoint-6200 β checkpoint-6500/adapter_model}/README.md +0 -0
- {checkpoint-6200 β checkpoint-6500/adapter_model}/adapter_config.json +0 -0
- {checkpoint-6200 β checkpoint-6500/adapter_model}/adapter_model.bin +1 -1
- {checkpoint-6200/adapter_model β checkpoint-6600}/README.md +0 -0
- {checkpoint-6200/adapter_model β checkpoint-6600}/adapter_config.json +0 -0
- {checkpoint-6200/adapter_model β checkpoint-6600}/adapter_model.bin +1 -1
- {checkpoint-6200 β checkpoint-6600}/optimizer.pt +1 -1
- {checkpoint-6200 β checkpoint-6600}/rng_state_0.pth +1 -1
- {checkpoint-6200 β checkpoint-6600}/rng_state_1.pth +1 -1
- {checkpoint-6200 β checkpoint-6600}/rng_state_10.pth +1 -1
- {checkpoint-6200 β checkpoint-6600}/rng_state_11.pth +1 -1
- {checkpoint-6200 β checkpoint-6600}/rng_state_12.pth +1 -1
- {checkpoint-6200 β checkpoint-6600}/rng_state_13.pth +1 -1
- {checkpoint-6200 β checkpoint-6600}/rng_state_2.pth +1 -1
- {checkpoint-6200 β checkpoint-6600}/rng_state_3.pth +1 -1
- {checkpoint-6200 β checkpoint-6600}/rng_state_4.pth +1 -1
- {checkpoint-6200 β checkpoint-6600}/rng_state_5.pth +1 -1
- {checkpoint-6200 β checkpoint-6600}/rng_state_6.pth +1 -1
- {checkpoint-6200 β checkpoint-6600}/rng_state_7.pth +1 -1
- {checkpoint-6200 β checkpoint-6600}/rng_state_8.pth +1 -1
- {checkpoint-6200 β checkpoint-6600}/rng_state_9.pth +1 -1
- {checkpoint-6200 β checkpoint-6600}/scheduler.pt +1 -1
- {checkpoint-6200 β checkpoint-6600}/trainer_state.json +99 -3
- {checkpoint-6200 β checkpoint-6600}/training_args.bin +0 -0
adapter_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 500897101
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d81f9de68995df3ae7fe51e14a4d5a0482b3ff50173f115d320ee99247cb5e3d
|
3 |
size 500897101
|
{checkpoint-6200 β checkpoint-6500/adapter_model}/README.md
RENAMED
File without changes
|
{checkpoint-6200 β checkpoint-6500/adapter_model}/adapter_config.json
RENAMED
File without changes
|
{checkpoint-6200 β checkpoint-6500/adapter_model}/adapter_model.bin
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 500897101
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eca317a26dab233b92de0d6d401d39cb8b1fe17ca51e4a191e73b88cb76bfc3d
|
3 |
size 500897101
|
{checkpoint-6200/adapter_model β checkpoint-6600}/README.md
RENAMED
File without changes
|
{checkpoint-6200/adapter_model β checkpoint-6600}/adapter_config.json
RENAMED
File without changes
|
{checkpoint-6200/adapter_model β checkpoint-6600}/adapter_model.bin
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 500897101
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d81f9de68995df3ae7fe51e14a4d5a0482b3ff50173f115d320ee99247cb5e3d
|
3 |
size 500897101
|
{checkpoint-6200 β checkpoint-6600}/optimizer.pt
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1001752701
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:126ec0322a5714bfa1d9503fe376d8ebf71cc64ffc913454c2c8b48b06bfd15f
|
3 |
size 1001752701
|
{checkpoint-6200 β checkpoint-6600}/rng_state_0.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6a6a609c8ce73fc706f6fb966ebfd028a35b6fc2b3ef2c3b90b14c2d9d96c073
|
3 |
size 27772
|
{checkpoint-6200 β checkpoint-6600}/rng_state_1.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:513344a4102cc8801ca6a9111665c65ff7e9a337b61788efc4dbd10afd40421e
|
3 |
size 27772
|
{checkpoint-6200 β checkpoint-6600}/rng_state_10.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27789
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:84bdaf5f54f27ae7dd4367ad1df5dc5c81c793f62be76df32dd2a92891c0ae9f
|
3 |
size 27789
|
{checkpoint-6200 β checkpoint-6600}/rng_state_11.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27789
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:98e58aa58921c7b94e7c72eb60e9c4d6abe4187fa10dfd3dde14df9291075366
|
3 |
size 27789
|
{checkpoint-6200 β checkpoint-6600}/rng_state_12.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27789
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:90a0a154457600ec617c2bdbb216fa73b29edafbe85cd1f69bdc45d06510b354
|
3 |
size 27789
|
{checkpoint-6200 β checkpoint-6600}/rng_state_13.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27789
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:702356496f60d3e621103bc084d4848106ba4006fdd2d5ad6640539693a5e42a
|
3 |
size 27789
|
{checkpoint-6200 β checkpoint-6600}/rng_state_2.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:046a0af63804ca31a141d5015a52b23ee2774bb6e4992759b32c342ddc173129
|
3 |
size 27772
|
{checkpoint-6200 β checkpoint-6600}/rng_state_3.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4eb3a5e7cd3e2477ec830ebb148f6b3b4ae734efaa4086c861d75bd02f98d32d
|
3 |
size 27772
|
{checkpoint-6200 β checkpoint-6600}/rng_state_4.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8dfd38532c9714d2d07dcbded515916fc4a2a8ebf7809eb89c8e40ba30623300
|
3 |
size 27772
|
{checkpoint-6200 β checkpoint-6600}/rng_state_5.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f6d24543c66c5d1f88ce0e125b12e7a3822599ea0fc5c8774770d4b6e36e9a0a
|
3 |
size 27772
|
{checkpoint-6200 β checkpoint-6600}/rng_state_6.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e194294db8d8734e6cc4d219d1f312dace676b799dac00f96ab1b32058105929
|
3 |
size 27772
|
{checkpoint-6200 β checkpoint-6600}/rng_state_7.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1970a2d9f7cb4f5fff840955a3b522a1b4bb096917d81f71d05d1ab7512a2d1a
|
3 |
size 27772
|
{checkpoint-6200 β checkpoint-6600}/rng_state_8.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e4d396595cc95649a6e4b094f41829540f57ac9e24ad4e6eb37d58aac423d45a
|
3 |
size 27772
|
{checkpoint-6200 β checkpoint-6600}/rng_state_9.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aed28956ad5859c504e2fb1745186ccc74f16e74b31582a197cb9dcab20b3d56
|
3 |
size 27772
|
{checkpoint-6200 β checkpoint-6600}/scheduler.pt
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 627
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:152f426be01aff254cb20a567c7989c603706f46efd9a2a941b2d4911bff72ad
|
3 |
size 627
|
{checkpoint-6200 β checkpoint-6600}/trainer_state.json
RENAMED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
-
"epoch": 2.
|
5 |
-
"global_step":
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
@@ -1518,11 +1518,107 @@
|
|
1518 |
"learning_rate": 1.8898031366808467e-05,
|
1519 |
"loss": 0.7654,
|
1520 |
"step": 6200
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1521 |
}
|
1522 |
],
|
1523 |
"max_steps": 7737,
|
1524 |
"num_train_epochs": 3,
|
1525 |
-
"total_flos": 2.
|
1526 |
"trial_name": null,
|
1527 |
"trial_params": null
|
1528 |
}
|
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
+
"epoch": 2.5591314462970143,
|
5 |
+
"global_step": 6600,
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
|
|
1518 |
"learning_rate": 1.8898031366808467e-05,
|
1519 |
"loss": 0.7654,
|
1520 |
"step": 6200
|
1521 |
+
},
|
1522 |
+
{
|
1523 |
+
"epoch": 2.41,
|
1524 |
+
"learning_rate": 1.830759827462004e-05,
|
1525 |
+
"loss": 0.7753,
|
1526 |
+
"step": 6225
|
1527 |
+
},
|
1528 |
+
{
|
1529 |
+
"epoch": 2.42,
|
1530 |
+
"learning_rate": 1.7725605054497906e-05,
|
1531 |
+
"loss": 0.7725,
|
1532 |
+
"step": 6250
|
1533 |
+
},
|
1534 |
+
{
|
1535 |
+
"epoch": 2.43,
|
1536 |
+
"learning_rate": 1.7152111833800522e-05,
|
1537 |
+
"loss": 0.7698,
|
1538 |
+
"step": 6275
|
1539 |
+
},
|
1540 |
+
{
|
1541 |
+
"epoch": 2.44,
|
1542 |
+
"learning_rate": 1.6587177861727454e-05,
|
1543 |
+
"loss": 0.7703,
|
1544 |
+
"step": 6300
|
1545 |
+
},
|
1546 |
+
{
|
1547 |
+
"epoch": 2.45,
|
1548 |
+
"learning_rate": 1.6030861503198204e-05,
|
1549 |
+
"loss": 0.7658,
|
1550 |
+
"step": 6325
|
1551 |
+
},
|
1552 |
+
{
|
1553 |
+
"epoch": 2.46,
|
1554 |
+
"learning_rate": 1.548322023282235e-05,
|
1555 |
+
"loss": 0.7677,
|
1556 |
+
"step": 6350
|
1557 |
+
},
|
1558 |
+
{
|
1559 |
+
"epoch": 2.47,
|
1560 |
+
"learning_rate": 1.4944310628961666e-05,
|
1561 |
+
"loss": 0.7694,
|
1562 |
+
"step": 6375
|
1563 |
+
},
|
1564 |
+
{
|
1565 |
+
"epoch": 2.48,
|
1566 |
+
"learning_rate": 1.4414188367884907e-05,
|
1567 |
+
"loss": 0.7668,
|
1568 |
+
"step": 6400
|
1569 |
+
},
|
1570 |
+
{
|
1571 |
+
"epoch": 2.49,
|
1572 |
+
"learning_rate": 1.3892908218015654e-05,
|
1573 |
+
"loss": 0.7662,
|
1574 |
+
"step": 6425
|
1575 |
+
},
|
1576 |
+
{
|
1577 |
+
"epoch": 2.5,
|
1578 |
+
"learning_rate": 1.3380524034274122e-05,
|
1579 |
+
"loss": 0.7689,
|
1580 |
+
"step": 6450
|
1581 |
+
},
|
1582 |
+
{
|
1583 |
+
"epoch": 2.51,
|
1584 |
+
"learning_rate": 1.2877088752513189e-05,
|
1585 |
+
"loss": 0.7694,
|
1586 |
+
"step": 6475
|
1587 |
+
},
|
1588 |
+
{
|
1589 |
+
"epoch": 2.52,
|
1590 |
+
"learning_rate": 1.2382654384049475e-05,
|
1591 |
+
"loss": 0.7714,
|
1592 |
+
"step": 6500
|
1593 |
+
},
|
1594 |
+
{
|
1595 |
+
"epoch": 2.53,
|
1596 |
+
"learning_rate": 1.1897272010289884e-05,
|
1597 |
+
"loss": 0.7701,
|
1598 |
+
"step": 6525
|
1599 |
+
},
|
1600 |
+
{
|
1601 |
+
"epoch": 2.54,
|
1602 |
+
"learning_rate": 1.1420991777454315e-05,
|
1603 |
+
"loss": 0.7628,
|
1604 |
+
"step": 6550
|
1605 |
+
},
|
1606 |
+
{
|
1607 |
+
"epoch": 2.55,
|
1608 |
+
"learning_rate": 1.0953862891394795e-05,
|
1609 |
+
"loss": 0.7661,
|
1610 |
+
"step": 6575
|
1611 |
+
},
|
1612 |
+
{
|
1613 |
+
"epoch": 2.56,
|
1614 |
+
"learning_rate": 1.0495933612511976e-05,
|
1615 |
+
"loss": 0.7729,
|
1616 |
+
"step": 6600
|
1617 |
}
|
1618 |
],
|
1619 |
"max_steps": 7737,
|
1620 |
"num_train_epochs": 3,
|
1621 |
+
"total_flos": 2.842466784500515e+19,
|
1622 |
"trial_name": null,
|
1623 |
"trial_params": null
|
1624 |
}
|
{checkpoint-6200 β checkpoint-6600}/training_args.bin
RENAMED
File without changes
|