Training in progress, step 750
Browse files- model-00001-of-00004.safetensors +1 -1
- model-00002-of-00004.safetensors +1 -1
- model-00003-of-00004.safetensors +1 -1
- model-00004-of-00004.safetensors +1 -1
- trainer_log.jsonl +32 -0
- training_args.bin +2 -2
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b72e0a03170a66b4b4c45fb0f17e335677139587679140101ae70fbd9afd74f8
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:83b0989d867d0e8c05bc25212c1e974719b4664c240aad04c84d3dd0725d3243
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:225f479523920e94a01f625a06b478b1f5ff94617846dbfbb0f30b71adf6ef17
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1258c37d5d8fbfc4431f62df566ab3877627b5ade68502fef5c584c461b06b84
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -726,3 +726,35 @@
|
|
726 |
{"current_steps": 726, "total_steps": 759, "loss": 0.3794, "lr": 5.748998743166256e-08, "epoch": 2.867676102699144, "percentage": 95.65, "elapsed_time": "6:13:47", "remaining_time": "0:16:59"}
|
727 |
{"current_steps": 727, "total_steps": 759, "loss": 0.3815, "lr": 5.4064735165506035e-08, "epoch": 2.871626069782752, "percentage": 95.78, "elapsed_time": "6:14:10", "remaining_time": "0:16:28"}
|
728 |
{"current_steps": 728, "total_steps": 759, "loss": 0.3654, "lr": 5.0744124891748956e-08, "epoch": 2.8755760368663594, "percentage": 95.92, "elapsed_time": "6:14:33", "remaining_time": "0:15:56"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
726 |
{"current_steps": 726, "total_steps": 759, "loss": 0.3794, "lr": 5.748998743166256e-08, "epoch": 2.867676102699144, "percentage": 95.65, "elapsed_time": "6:13:47", "remaining_time": "0:16:59"}
|
727 |
{"current_steps": 727, "total_steps": 759, "loss": 0.3815, "lr": 5.4064735165506035e-08, "epoch": 2.871626069782752, "percentage": 95.78, "elapsed_time": "6:14:10", "remaining_time": "0:16:28"}
|
728 |
{"current_steps": 728, "total_steps": 759, "loss": 0.3654, "lr": 5.0744124891748956e-08, "epoch": 2.8755760368663594, "percentage": 95.92, "elapsed_time": "6:14:33", "remaining_time": "0:15:56"}
|
729 |
+
{"current_steps": 729, "total_steps": 759, "loss": 0.3561, "lr": 4.7528226865107274e-08, "epoch": 2.879526003949967, "percentage": 96.05, "elapsed_time": "6:14:57", "remaining_time": "0:15:25"}
|
730 |
+
{"current_steps": 730, "total_steps": 759, "loss": 0.3741, "lr": 4.4417109124882394e-08, "epoch": 2.8834759710335747, "percentage": 96.18, "elapsed_time": "6:15:20", "remaining_time": "0:14:54"}
|
731 |
+
{"current_steps": 731, "total_steps": 759, "loss": 0.3726, "lr": 4.1410837493519595e-08, "epoch": 2.8874259381171825, "percentage": 96.31, "elapsed_time": "6:17:14", "remaining_time": "0:14:26"}
|
732 |
+
{"current_steps": 732, "total_steps": 759, "loss": 0.3851, "lr": 3.8509475575219115e-08, "epoch": 2.89137590520079, "percentage": 96.44, "elapsed_time": "6:17:37", "remaining_time": "0:13:55"}
|
733 |
+
{"current_steps": 733, "total_steps": 759, "loss": 0.3669, "lr": 3.571308475458723e-08, "epoch": 2.8953258722843978, "percentage": 96.57, "elapsed_time": "6:18:00", "remaining_time": "0:13:24"}
|
734 |
+
{"current_steps": 734, "total_steps": 759, "loss": 0.357, "lr": 3.302172419534011e-08, "epoch": 2.899275839368005, "percentage": 96.71, "elapsed_time": "6:18:23", "remaining_time": "0:12:53"}
|
735 |
+
{"current_steps": 735, "total_steps": 759, "loss": 0.3399, "lr": 3.04354508390492e-08, "epoch": 2.903225806451613, "percentage": 96.84, "elapsed_time": "6:18:46", "remaining_time": "0:12:22"}
|
736 |
+
{"current_steps": 736, "total_steps": 759, "loss": 0.368, "lr": 2.7954319403940555e-08, "epoch": 2.9071757735352204, "percentage": 96.97, "elapsed_time": "6:19:09", "remaining_time": "0:11:50"}
|
737 |
+
{"current_steps": 737, "total_steps": 759, "loss": 0.3574, "lr": 2.5578382383732446e-08, "epoch": 2.9111257406188282, "percentage": 97.1, "elapsed_time": "6:19:32", "remaining_time": "0:11:19"}
|
738 |
+
{"current_steps": 738, "total_steps": 759, "loss": 0.3805, "lr": 2.3307690046527887e-08, "epoch": 2.915075707702436, "percentage": 97.23, "elapsed_time": "6:19:55", "remaining_time": "0:10:48"}
|
739 |
+
{"current_steps": 739, "total_steps": 759, "loss": 0.3699, "lr": 2.114229043375049e-08, "epoch": 2.9190256747860435, "percentage": 97.36, "elapsed_time": "6:20:19", "remaining_time": "0:10:17"}
|
740 |
+
{"current_steps": 740, "total_steps": 759, "loss": 0.3743, "lr": 1.9082229359127512e-08, "epoch": 2.922975641869651, "percentage": 97.5, "elapsed_time": "6:20:42", "remaining_time": "0:09:46"}
|
741 |
+
{"current_steps": 741, "total_steps": 759, "loss": 0.3597, "lr": 1.7127550407721184e-08, "epoch": 2.9269256089532587, "percentage": 97.63, "elapsed_time": "6:22:06", "remaining_time": "0:09:16"}
|
742 |
+
{"current_steps": 742, "total_steps": 759, "loss": 0.3519, "lr": 1.52782949350061e-08, "epoch": 2.9308755760368665, "percentage": 97.76, "elapsed_time": "6:22:29", "remaining_time": "0:08:45"}
|
743 |
+
{"current_steps": 741, "total_steps": 759, "loss": 0.3609, "lr": 1.7127550407721184e-08, "epoch": 2.9282422646477944, "percentage": 97.63, "elapsed_time": "0:00:44", "remaining_time": "0:00:01"}
|
744 |
+
{"current_steps": 742, "total_steps": 759, "loss": 0.3483, "lr": 1.52782949350061e-08, "epoch": 2.932192231731402, "percentage": 97.76, "elapsed_time": "0:01:08", "remaining_time": "0:00:01"}
|
745 |
+
{"current_steps": 743, "total_steps": 759, "loss": 0.3577, "lr": 1.3534502065993826e-08, "epoch": 2.93614219881501, "percentage": 97.89, "elapsed_time": "0:01:33", "remaining_time": "0:00:02"}
|
746 |
+
{"current_steps": 744, "total_steps": 759, "loss": 0.3537, "lr": 1.1896208694406886e-08, "epoch": 2.9400921658986174, "percentage": 98.02, "elapsed_time": "0:01:57", "remaining_time": "0:00:02"}
|
747 |
+
{"current_steps": 745, "total_steps": 759, "loss": 0.3611, "lr": 1.0363449481896604e-08, "epoch": 2.9440421329822253, "percentage": 98.16, "elapsed_time": "0:02:22", "remaining_time": "0:00:02"}
|
748 |
+
{"current_steps": 746, "total_steps": 759, "loss": 0.3369, "lr": 8.936256857308701e-09, "epoch": 2.9479921000658327, "percentage": 98.29, "elapsed_time": "0:02:47", "remaining_time": "0:00:02"}
|
749 |
+
{"current_steps": 747, "total_steps": 759, "loss": 0.3636, "lr": 7.614661016001056e-09, "epoch": 2.9519420671494405, "percentage": 98.42, "elapsed_time": "0:03:12", "remaining_time": "0:00:03"}
|
750 |
+
{"current_steps": 748, "total_steps": 759, "loss": 0.3549, "lr": 6.398689919201451e-09, "epoch": 2.955892034233048, "percentage": 98.55, "elapsed_time": "0:03:37", "remaining_time": "0:00:03"}
|
751 |
+
{"current_steps": 749, "total_steps": 759, "loss": 0.3502, "lr": 5.288369293415807e-09, "epoch": 2.9598420013166558, "percentage": 98.68, "elapsed_time": "0:04:03", "remaining_time": "0:00:03"}
|
752 |
+
{"current_steps": 750, "total_steps": 759, "loss": 0.36, "lr": 4.283722629887521e-09, "epoch": 2.9637919684002636, "percentage": 98.81, "elapsed_time": "0:04:28", "remaining_time": "0:00:03"}
|
753 |
+
{"current_steps": 751, "total_steps": 759, "loss": 0.3594, "lr": 3.3847711840950813e-09, "epoch": 2.967741935483871, "percentage": 98.95, "elapsed_time": "0:06:37", "remaining_time": "0:00:04"}
|
754 |
+
{"current_steps": 752, "total_steps": 759, "loss": 0.3745, "lr": 2.5915339753085355e-09, "epoch": 2.9716919025674784, "percentage": 99.08, "elapsed_time": "0:07:02", "remaining_time": "0:00:03"}
|
755 |
+
{"current_steps": 753, "total_steps": 759, "loss": 0.388, "lr": 1.9040277861814836e-09, "epoch": 2.9756418696510862, "percentage": 99.21, "elapsed_time": "0:07:27", "remaining_time": "0:00:03"}
|
756 |
+
{"current_steps": 754, "total_steps": 759, "loss": 0.3546, "lr": 1.3222671623991379e-09, "epoch": 2.979591836734694, "percentage": 99.34, "elapsed_time": "0:07:53", "remaining_time": "0:00:03"}
|
757 |
+
{"current_steps": 755, "total_steps": 759, "loss": 0.353, "lr": 8.462644123696794e-10, "epoch": 2.9835418038183015, "percentage": 99.47, "elapsed_time": "0:08:18", "remaining_time": "0:00:02"}
|
758 |
+
{"current_steps": 756, "total_steps": 759, "loss": 0.3509, "lr": 4.760296069639125e-10, "epoch": 2.9874917709019093, "percentage": 99.6, "elapsed_time": "0:08:44", "remaining_time": "0:00:02"}
|
759 |
+
{"current_steps": 757, "total_steps": 759, "loss": 0.355, "lr": 2.1157057930321079e-10, "epoch": 2.9914417379855167, "percentage": 99.74, "elapsed_time": "0:09:10", "remaining_time": "0:00:01"}
|
760 |
+
{"current_steps": 758, "total_steps": 759, "loss": 0.359, "lr": 5.289292459187412e-11, "epoch": 2.9953917050691246, "percentage": 99.87, "elapsed_time": "0:09:35", "remaining_time": "0:00:00"}
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:63a2dec218e4be041cea0ecb002e79aa9d239d8bc94e23b9041e85ad7f6808f0
|
3 |
+
size 7480
|