geshijoker
commited on
Training in progress, step 1000
Browse files
adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 671149168
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7b402f011cae2465741e7257dd25811cc43d8065bb16a0d52921d63125728815
|
3 |
size 671149168
|
runs/Dec29_06-04-47_64-181-222-101/events.out.tfevents.1735452702.64-181-222-101.26519.0
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a9a3e6404b78d3bbe378285f2c5f0b051c6807e6f0a9c43b28d1db5b2d52bf90
|
3 |
+
size 26678
|
trainer_log.jsonl
CHANGED
@@ -48,3 +48,54 @@
|
|
48 |
{"current_steps": 480, "total_steps": 1053, "loss": 1.7693, "lr": 3.068328039116616e-05, "epoch": 1.3650906505510132, "percentage": 45.58, "elapsed_time": "1:36:07", "remaining_time": "1:54:45"}
|
49 |
{"current_steps": 490, "total_steps": 1053, "loss": 1.7712, "lr": 2.99157673653855e-05, "epoch": 1.3935300391041592, "percentage": 46.53, "elapsed_time": "1:38:04", "remaining_time": "1:52:40"}
|
50 |
{"current_steps": 500, "total_steps": 1053, "loss": 1.7613, "lr": 2.9143403070702997e-05, "epoch": 1.4219694276573054, "percentage": 47.48, "elapsed_time": "1:40:05", "remaining_time": "1:50:42"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
48 |
{"current_steps": 480, "total_steps": 1053, "loss": 1.7693, "lr": 3.068328039116616e-05, "epoch": 1.3650906505510132, "percentage": 45.58, "elapsed_time": "1:36:07", "remaining_time": "1:54:45"}
|
49 |
{"current_steps": 490, "total_steps": 1053, "loss": 1.7712, "lr": 2.99157673653855e-05, "epoch": 1.3935300391041592, "percentage": 46.53, "elapsed_time": "1:38:04", "remaining_time": "1:52:40"}
|
50 |
{"current_steps": 500, "total_steps": 1053, "loss": 1.7613, "lr": 2.9143403070702997e-05, "epoch": 1.4219694276573054, "percentage": 47.48, "elapsed_time": "1:40:05", "remaining_time": "1:50:42"}
|
51 |
+
{"current_steps": 510, "total_steps": 1053, "loss": 1.7729, "lr": 2.8366949737428817e-05, "epoch": 1.4504088162104516, "percentage": 48.43, "elapsed_time": "1:42:10", "remaining_time": "1:48:47"}
|
52 |
+
{"current_steps": 520, "total_steps": 1053, "loss": 1.7649, "lr": 2.7587173631260566e-05, "epoch": 1.4788482047635976, "percentage": 49.38, "elapsed_time": "1:44:07", "remaining_time": "1:46:43"}
|
53 |
+
{"current_steps": 530, "total_steps": 1053, "loss": 1.747, "lr": 2.6804844297071526e-05, "epoch": 1.5072875933167436, "percentage": 50.33, "elapsed_time": "1:46:10", "remaining_time": "1:44:45"}
|
54 |
+
{"current_steps": 540, "total_steps": 1053, "loss": 1.7496, "lr": 2.6020733799462754e-05, "epoch": 1.5357269818698898, "percentage": 51.28, "elapsed_time": "1:48:06", "remaining_time": "1:42:42"}
|
55 |
+
{"current_steps": 550, "total_steps": 1053, "loss": 1.7517, "lr": 2.5235615960828605e-05, "epoch": 1.564166370423036, "percentage": 52.23, "elapsed_time": "1:50:10", "remaining_time": "1:40:45"}
|
56 |
+
{"current_steps": 560, "total_steps": 1053, "loss": 1.7768, "lr": 2.4450265597687376e-05, "epoch": 1.5926057589761822, "percentage": 53.18, "elapsed_time": "1:52:12", "remaining_time": "1:38:46"}
|
57 |
+
{"current_steps": 570, "total_steps": 1053, "loss": 1.7369, "lr": 2.3665457756030988e-05, "epoch": 1.6210451475293282, "percentage": 54.13, "elapsed_time": "1:54:11", "remaining_time": "1:36:45"}
|
58 |
+
{"current_steps": 580, "total_steps": 1053, "loss": 1.7389, "lr": 2.2881966946448167e-05, "epoch": 1.6494845360824741, "percentage": 55.08, "elapsed_time": "1:56:12", "remaining_time": "1:34:46"}
|
59 |
+
{"current_steps": 590, "total_steps": 1053, "loss": 1.7364, "lr": 2.2100566379775967e-05, "epoch": 1.6779239246356203, "percentage": 56.03, "elapsed_time": "1:58:11", "remaining_time": "1:32:44"}
|
60 |
+
{"current_steps": 600, "total_steps": 1053, "loss": 1.7447, "lr": 2.1322027204034066e-05, "epoch": 1.7063633131887666, "percentage": 56.98, "elapsed_time": "2:00:12", "remaining_time": "1:30:45"}
|
61 |
+
{"current_steps": 610, "total_steps": 1053, "loss": 1.7647, "lr": 2.0547117743394744e-05, "epoch": 1.7348027017419125, "percentage": 57.93, "elapsed_time": "2:02:12", "remaining_time": "1:28:44"}
|
62 |
+
{"current_steps": 620, "total_steps": 1053, "loss": 1.7343, "lr": 1.9776602739939714e-05, "epoch": 1.7632420902950585, "percentage": 58.88, "elapsed_time": "2:04:14", "remaining_time": "1:26:46"}
|
63 |
+
{"current_steps": 630, "total_steps": 1053, "loss": 1.7402, "lr": 1.9011242598951962e-05, "epoch": 1.7916814788482047, "percentage": 59.83, "elapsed_time": "2:06:17", "remaining_time": "1:24:47"}
|
64 |
+
{"current_steps": 640, "total_steps": 1053, "loss": 1.7421, "lr": 1.8251792638487596e-05, "epoch": 1.820120867401351, "percentage": 60.78, "elapsed_time": "2:08:16", "remaining_time": "1:22:46"}
|
65 |
+
{"current_steps": 650, "total_steps": 1053, "loss": 1.7303, "lr": 1.7499002343968098e-05, "epoch": 1.8485602559544971, "percentage": 61.73, "elapsed_time": "2:10:10", "remaining_time": "1:20:42"}
|
66 |
+
{"current_steps": 660, "total_steps": 1053, "loss": 1.7236, "lr": 1.675361462852868e-05, "epoch": 1.8769996445076431, "percentage": 62.68, "elapsed_time": "2:12:18", "remaining_time": "1:18:46"}
|
67 |
+
{"current_steps": 670, "total_steps": 1053, "loss": 1.7163, "lr": 1.6016365099852735e-05, "epoch": 1.905439033060789, "percentage": 63.63, "elapsed_time": "2:14:21", "remaining_time": "1:16:48"}
|
68 |
+
{"current_steps": 680, "total_steps": 1053, "loss": 1.7253, "lr": 1.528798133421585e-05, "epoch": 1.9338784216139353, "percentage": 64.58, "elapsed_time": "2:16:19", "remaining_time": "1:14:46"}
|
69 |
+
{"current_steps": 690, "total_steps": 1053, "loss": 1.7054, "lr": 1.4569182158455875e-05, "epoch": 1.9623178101670815, "percentage": 65.53, "elapsed_time": "2:18:17", "remaining_time": "1:12:45"}
|
70 |
+
{"current_steps": 700, "total_steps": 1053, "loss": 1.7469, "lr": 1.3860676940577594e-05, "epoch": 1.9907571987202275, "percentage": 66.48, "elapsed_time": "2:20:23", "remaining_time": "1:10:47"}
|
71 |
+
{"current_steps": 710, "total_steps": 1053, "loss": 1.7598, "lr": 1.3163164889692197e-05, "epoch": 2.0191965872733735, "percentage": 67.43, "elapsed_time": "2:22:24", "remaining_time": "1:08:47"}
|
72 |
+
{"current_steps": 720, "total_steps": 1053, "loss": 1.6736, "lr": 1.2477334365982248e-05, "epoch": 2.0476359758265197, "percentage": 68.38, "elapsed_time": "2:24:22", "remaining_time": "1:06:46"}
|
73 |
+
{"current_steps": 730, "total_steps": 1053, "loss": 1.6529, "lr": 1.1803862201373342e-05, "epoch": 2.076075364379666, "percentage": 69.33, "elapsed_time": "2:26:24", "remaining_time": "1:04:46"}
|
74 |
+
{"current_steps": 740, "total_steps": 1053, "loss": 1.6734, "lr": 1.1143413031582645e-05, "epoch": 2.104514752932812, "percentage": 70.28, "elapsed_time": "2:28:26", "remaining_time": "1:02:47"}
|
75 |
+
{"current_steps": 750, "total_steps": 1053, "loss": 1.6702, "lr": 1.0496638640203774e-05, "epoch": 2.132954141485958, "percentage": 71.23, "elapsed_time": "2:30:22", "remaining_time": "1:00:44"}
|
76 |
+
{"current_steps": 760, "total_steps": 1053, "loss": 1.6613, "lr": 9.864177315474968e-06, "epoch": 2.161393530039104, "percentage": 72.17, "elapsed_time": "2:32:22", "remaining_time": "0:58:44"}
|
77 |
+
{"current_steps": 770, "total_steps": 1053, "loss": 1.6898, "lr": 9.246653220365778e-06, "epoch": 2.1898329185922503, "percentage": 73.12, "elapsed_time": "2:34:25", "remaining_time": "0:56:45"}
|
78 |
+
{"current_steps": 780, "total_steps": 1053, "loss": 1.6688, "lr": 8.644675776603476e-06, "epoch": 2.2182723071453965, "percentage": 74.07, "elapsed_time": "2:36:25", "remaining_time": "0:54:45"}
|
79 |
+
{"current_steps": 790, "total_steps": 1053, "loss": 1.6761, "lr": 8.058839063247447e-06, "epoch": 2.2467116956985427, "percentage": 75.02, "elapsed_time": "2:38:28", "remaining_time": "0:52:45"}
|
80 |
+
{"current_steps": 800, "total_steps": 1053, "loss": 1.7022, "lr": 7.489721230404842e-06, "epoch": 2.2751510842516884, "percentage": 75.97, "elapsed_time": "2:40:28", "remaining_time": "0:50:44"}
|
81 |
+
{"current_steps": 810, "total_steps": 1053, "loss": 1.6778, "lr": 6.937883928666255e-06, "epoch": 2.3035904728048346, "percentage": 76.92, "elapsed_time": "2:42:33", "remaining_time": "0:48:46"}
|
82 |
+
{"current_steps": 820, "total_steps": 1053, "loss": 1.6517, "lr": 6.403871754824373e-06, "epoch": 2.332029861357981, "percentage": 77.87, "elapsed_time": "2:44:28", "remaining_time": "0:46:44"}
|
83 |
+
{"current_steps": 830, "total_steps": 1053, "loss": 1.6696, "lr": 5.8882117144227115e-06, "epoch": 2.360469249911127, "percentage": 78.82, "elapsed_time": "2:46:26", "remaining_time": "0:44:43"}
|
84 |
+
{"current_steps": 840, "total_steps": 1053, "loss": 1.6452, "lr": 5.391412701664744e-06, "epoch": 2.3889086384642733, "percentage": 79.77, "elapsed_time": "2:48:29", "remaining_time": "0:42:43"}
|
85 |
+
{"current_steps": 850, "total_steps": 1053, "loss": 1.6739, "lr": 4.91396499719681e-06, "epoch": 2.417348027017419, "percentage": 80.72, "elapsed_time": "2:50:32", "remaining_time": "0:40:43"}
|
86 |
+
{"current_steps": 860, "total_steps": 1053, "loss": 1.6582, "lr": 4.456339784260247e-06, "epoch": 2.4457874155705652, "percentage": 81.67, "elapsed_time": "2:52:32", "remaining_time": "0:38:43"}
|
87 |
+
{"current_steps": 870, "total_steps": 1053, "loss": 1.6483, "lr": 4.018988683690461e-06, "epoch": 2.4742268041237114, "percentage": 82.62, "elapsed_time": "2:54:30", "remaining_time": "0:36:42"}
|
88 |
+
{"current_steps": 880, "total_steps": 1053, "loss": 1.6731, "lr": 3.6023433082216755e-06, "epoch": 2.502666192676857, "percentage": 83.57, "elapsed_time": "2:56:33", "remaining_time": "0:34:42"}
|
89 |
+
{"current_steps": 890, "total_steps": 1053, "loss": 1.6705, "lr": 3.2068148365372806e-06, "epoch": 2.5311055812300034, "percentage": 84.52, "elapsed_time": "2:58:28", "remaining_time": "0:32:41"}
|
90 |
+
{"current_steps": 900, "total_steps": 1053, "loss": 1.6851, "lr": 2.832793607486087e-06, "epoch": 2.5595449697831496, "percentage": 85.47, "elapsed_time": "3:00:29", "remaining_time": "0:30:41"}
|
91 |
+
{"current_steps": 910, "total_steps": 1053, "loss": 1.6464, "lr": 2.4806487348650485e-06, "epoch": 2.587984358336296, "percentage": 86.42, "elapsed_time": "3:02:27", "remaining_time": "0:28:40"}
|
92 |
+
{"current_steps": 920, "total_steps": 1053, "loss": 1.6576, "lr": 2.150727743148473e-06, "epoch": 2.616423746889442, "percentage": 87.37, "elapsed_time": "3:04:25", "remaining_time": "0:26:39"}
|
93 |
+
{"current_steps": 930, "total_steps": 1053, "loss": 1.6304, "lr": 1.8433562245233349e-06, "epoch": 2.6448631354425878, "percentage": 88.32, "elapsed_time": "3:06:26", "remaining_time": "0:24:39"}
|
94 |
+
{"current_steps": 940, "total_steps": 1053, "loss": 1.6674, "lr": 1.5588375175691117e-06, "epoch": 2.673302523995734, "percentage": 89.27, "elapsed_time": "3:08:29", "remaining_time": "0:22:39"}
|
95 |
+
{"current_steps": 950, "total_steps": 1053, "loss": 1.6493, "lr": 1.2974524078991995e-06, "epoch": 2.70174191254888, "percentage": 90.22, "elapsed_time": "3:10:29", "remaining_time": "0:20:39"}
|
96 |
+
{"current_steps": 960, "total_steps": 1053, "loss": 1.6529, "lr": 1.0594588510594445e-06, "epoch": 2.7301813011020264, "percentage": 91.17, "elapsed_time": "3:12:29", "remaining_time": "0:18:38"}
|
97 |
+
{"current_steps": 970, "total_steps": 1053, "loss": 1.6612, "lr": 8.450917179571305e-07, "epoch": 2.7586206896551726, "percentage": 92.12, "elapsed_time": "3:14:26", "remaining_time": "0:16:38"}
|
98 |
+
{"current_steps": 980, "total_steps": 1053, "loss": 1.6637, "lr": 6.545625630717783e-07, "epoch": 2.7870600782083184, "percentage": 93.07, "elapsed_time": "3:16:27", "remaining_time": "0:14:38"}
|
99 |
+
{"current_steps": 990, "total_steps": 1053, "loss": 1.6784, "lr": 4.880594156763896e-07, "epoch": 2.8154994667614646, "percentage": 94.02, "elapsed_time": "3:18:25", "remaining_time": "0:12:37"}
|
100 |
+
{"current_steps": 1000, "total_steps": 1053, "loss": 1.6679, "lr": 3.4574659427528133e-07, "epoch": 2.8439388553146108, "percentage": 94.97, "elapsed_time": "3:20:25", "remaining_time": "0:10:37"}
|
101 |
+
{"current_steps": 1000, "total_steps": 1053, "eval_loss": 1.758003830909729, "epoch": 2.8439388553146108, "percentage": 94.97, "elapsed_time": "3:23:26", "remaining_time": "0:10:46"}
|