Rakancorle1
committed on
Commit
•
664f2da
1
Parent(s):
3dbd63c
Training in progress, step 1875
Browse files
- adapter_model.safetensors +1 -1
- trainer_log.jsonl +38 -0
adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 42002584
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eb6c73e7038e47b4b96c031b683047e39844064279265e204f25f051056d740b
|
3 |
size 42002584
|
trainer_log.jsonl
CHANGED
@@ -148,3 +148,41 @@
|
|
148 |
{"current_steps": 1480, "total_steps": 1875, "loss": 0.2677, "lr": 1.0556519461023301e-05, "epoch": 2.368, "percentage": 78.93, "elapsed_time": "3:29:14", "remaining_time": "0:55:50"}
|
149 |
{"current_steps": 1490, "total_steps": 1875, "loss": 0.2821, "lr": 1.0047226923189024e-05, "epoch": 2.384, "percentage": 79.47, "elapsed_time": "3:30:38", "remaining_time": "0:54:25"}
|
150 |
{"current_steps": 1500, "total_steps": 1875, "loss": 0.2628, "lr": 9.549150281252633e-06, "epoch": 2.4, "percentage": 80.0, "elapsed_time": "3:32:02", "remaining_time": "0:53:00"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
148 |
{"current_steps": 1480, "total_steps": 1875, "loss": 0.2677, "lr": 1.0556519461023301e-05, "epoch": 2.368, "percentage": 78.93, "elapsed_time": "3:29:14", "remaining_time": "0:55:50"}
|
149 |
{"current_steps": 1490, "total_steps": 1875, "loss": 0.2821, "lr": 1.0047226923189024e-05, "epoch": 2.384, "percentage": 79.47, "elapsed_time": "3:30:38", "remaining_time": "0:54:25"}
|
150 |
{"current_steps": 1500, "total_steps": 1875, "loss": 0.2628, "lr": 9.549150281252633e-06, "epoch": 2.4, "percentage": 80.0, "elapsed_time": "3:32:02", "remaining_time": "0:53:00"}
|
151 |
+
{"current_steps": 1510, "total_steps": 1875, "loss": 0.2648, "lr": 9.06242935969528e-06, "epoch": 2.416, "percentage": 80.53, "elapsed_time": "3:33:36", "remaining_time": "0:51:38"}
|
152 |
+
{"current_steps": 1520, "total_steps": 1875, "loss": 0.2718, "lr": 8.587200795119793e-06, "epoch": 2.432, "percentage": 81.07, "elapsed_time": "3:35:00", "remaining_time": "0:50:13"}
|
153 |
+
{"current_steps": 1530, "total_steps": 1875, "loss": 0.2779, "lr": 8.123597997892918e-06, "epoch": 2.448, "percentage": 81.6, "elapsed_time": "3:36:25", "remaining_time": "0:48:48"}
|
154 |
+
{"current_steps": 1540, "total_steps": 1875, "loss": 0.2522, "lr": 7.671751114693104e-06, "epoch": 2.464, "percentage": 82.13, "elapsed_time": "3:37:50", "remaining_time": "0:47:23"}
|
155 |
+
{"current_steps": 1550, "total_steps": 1875, "loss": 0.2668, "lr": 7.2317869919746705e-06, "epoch": 2.48, "percentage": 82.67, "elapsed_time": "3:39:14", "remaining_time": "0:45:58"}
|
156 |
+
{"current_steps": 1560, "total_steps": 1875, "loss": 0.2582, "lr": 6.803829140358237e-06, "epoch": 2.496, "percentage": 83.2, "elapsed_time": "3:40:38", "remaining_time": "0:44:33"}
|
157 |
+
{"current_steps": 1570, "total_steps": 1875, "loss": 0.2509, "lr": 6.3879976999578154e-06, "epoch": 2.512, "percentage": 83.73, "elapsed_time": "3:42:02", "remaining_time": "0:43:08"}
|
158 |
+
{"current_steps": 1580, "total_steps": 1875, "loss": 0.2743, "lr": 5.98440940665399e-06, "epoch": 2.528, "percentage": 84.27, "elapsed_time": "3:43:26", "remaining_time": "0:41:43"}
|
159 |
+
{"current_steps": 1590, "total_steps": 1875, "loss": 0.2833, "lr": 5.593177559322777e-06, "epoch": 2.544, "percentage": 84.8, "elapsed_time": "3:44:49", "remaining_time": "0:40:17"}
|
160 |
+
{"current_steps": 1600, "total_steps": 1875, "loss": 0.2693, "lr": 5.214411988029355e-06, "epoch": 2.56, "percentage": 85.33, "elapsed_time": "3:46:12", "remaining_time": "0:38:52"}
|
161 |
+
{"current_steps": 1610, "total_steps": 1875, "loss": 0.2607, "lr": 4.848219023195644e-06, "epoch": 2.576, "percentage": 85.87, "elapsed_time": "3:47:35", "remaining_time": "0:37:27"}
|
162 |
+
{"current_steps": 1620, "total_steps": 1875, "loss": 0.2632, "lr": 4.494701465750217e-06, "epoch": 2.592, "percentage": 86.4, "elapsed_time": "3:48:59", "remaining_time": "0:36:02"}
|
163 |
+
{"current_steps": 1630, "total_steps": 1875, "loss": 0.2573, "lr": 4.153958558269189e-06, "epoch": 2.608, "percentage": 86.93, "elapsed_time": "3:50:22", "remaining_time": "0:34:37"}
|
164 |
+
{"current_steps": 1640, "total_steps": 1875, "loss": 0.2411, "lr": 3.826085957115888e-06, "epoch": 2.624, "percentage": 87.47, "elapsed_time": "3:51:45", "remaining_time": "0:33:12"}
|
165 |
+
{"current_steps": 1650, "total_steps": 1875, "loss": 0.2601, "lr": 3.511175705587433e-06, "epoch": 2.64, "percentage": 88.0, "elapsed_time": "3:53:08", "remaining_time": "0:31:47"}
|
166 |
+
{"current_steps": 1660, "total_steps": 1875, "loss": 0.2832, "lr": 3.2093162080754637e-06, "epoch": 2.656, "percentage": 88.53, "elapsed_time": "3:54:32", "remaining_time": "0:30:22"}
|
167 |
+
{"current_steps": 1670, "total_steps": 1875, "loss": 0.2725, "lr": 2.9205922052484958e-06, "epoch": 2.672, "percentage": 89.07, "elapsed_time": "3:55:55", "remaining_time": "0:28:57"}
|
168 |
+
{"current_steps": 1680, "total_steps": 1875, "loss": 0.2654, "lr": 2.6450847502627884e-06, "epoch": 2.6879999999999997, "percentage": 89.6, "elapsed_time": "3:57:18", "remaining_time": "0:27:32"}
|
169 |
+
{"current_steps": 1690, "total_steps": 1875, "loss": 0.2784, "lr": 2.3828711860083674e-06, "epoch": 2.7039999999999997, "percentage": 90.13, "elapsed_time": "3:58:41", "remaining_time": "0:26:07"}
|
170 |
+
{"current_steps": 1700, "total_steps": 1875, "loss": 0.2758, "lr": 2.134025123396638e-06, "epoch": 2.7199999999999998, "percentage": 90.67, "elapsed_time": "4:00:05", "remaining_time": "0:24:42"}
|
171 |
+
{"current_steps": 1710, "total_steps": 1875, "loss": 0.2533, "lr": 1.8986164206957035e-06, "epoch": 2.7359999999999998, "percentage": 91.2, "elapsed_time": "4:01:28", "remaining_time": "0:23:17"}
|
172 |
+
{"current_steps": 1720, "total_steps": 1875, "loss": 0.268, "lr": 1.6767111639191202e-06, "epoch": 2.752, "percentage": 91.73, "elapsed_time": "4:02:51", "remaining_time": "0:21:53"}
|
173 |
+
{"current_steps": 1730, "total_steps": 1875, "loss": 0.28, "lr": 1.4683716482736366e-06, "epoch": 2.768, "percentage": 92.27, "elapsed_time": "4:04:14", "remaining_time": "0:20:28"}
|
174 |
+
{"current_steps": 1740, "total_steps": 1875, "loss": 0.2797, "lr": 1.2736563606711382e-06, "epoch": 2.784, "percentage": 92.8, "elapsed_time": "4:05:37", "remaining_time": "0:19:03"}
|
175 |
+
{"current_steps": 1750, "total_steps": 1875, "loss": 0.2831, "lr": 1.0926199633097157e-06, "epoch": 2.8, "percentage": 93.33, "elapsed_time": "4:07:00", "remaining_time": "0:17:38"}
|
176 |
+
{"current_steps": 1760, "total_steps": 1875, "loss": 0.2558, "lr": 9.253132783283547e-07, "epoch": 2.816, "percentage": 93.87, "elapsed_time": "4:08:23", "remaining_time": "0:16:13"}
|
177 |
+
{"current_steps": 1770, "total_steps": 1875, "loss": 0.2635, "lr": 7.717832735397335e-07, "epoch": 2.832, "percentage": 94.4, "elapsed_time": "4:09:48", "remaining_time": "0:14:49"}
|
178 |
+
{"current_steps": 1780, "total_steps": 1875, "loss": 0.2639, "lr": 6.3207304924498e-07, "epoch": 2.848, "percentage": 94.93, "elapsed_time": "4:11:12", "remaining_time": "0:13:24"}
|
179 |
+
{"current_steps": 1790, "total_steps": 1875, "loss": 0.2532, "lr": 5.062218261342122e-07, "epoch": 2.864, "percentage": 95.47, "elapsed_time": "4:12:36", "remaining_time": "0:11:59"}
|
180 |
+
{"current_steps": 1800, "total_steps": 1875, "loss": 0.2327, "lr": 3.9426493427611177e-07, "epoch": 2.88, "percentage": 96.0, "elapsed_time": "4:14:00", "remaining_time": "0:10:35"}
|
181 |
+
{"current_steps": 1810, "total_steps": 1875, "loss": 0.2621, "lr": 2.962338031997691e-07, "epoch": 2.896, "percentage": 96.53, "elapsed_time": "4:15:23", "remaining_time": "0:09:10"}
|
182 |
+
{"current_steps": 1820, "total_steps": 1875, "loss": 0.256, "lr": 2.1215595307154667e-07, "epoch": 2.912, "percentage": 97.07, "elapsed_time": "4:16:47", "remaining_time": "0:07:45"}
|
183 |
+
{"current_steps": 1830, "total_steps": 1875, "loss": 0.2545, "lr": 1.420549869693033e-07, "epoch": 2.928, "percentage": 97.6, "elapsed_time": "4:18:11", "remaining_time": "0:06:20"}
|
184 |
+
{"current_steps": 1840, "total_steps": 1875, "loss": 0.2596, "lr": 8.595058425640013e-08, "epoch": 2.944, "percentage": 98.13, "elapsed_time": "4:19:34", "remaining_time": "0:04:56"}
|
185 |
+
{"current_steps": 1850, "total_steps": 1875, "loss": 0.2584, "lr": 4.385849505708084e-08, "epoch": 2.96, "percentage": 98.67, "elapsed_time": "4:20:58", "remaining_time": "0:03:31"}
|
186 |
+
{"current_steps": 1860, "total_steps": 1875, "loss": 0.2752, "lr": 1.5790535835003008e-08, "epoch": 2.976, "percentage": 99.2, "elapsed_time": "4:22:21", "remaining_time": "0:02:06"}
|
187 |
+
{"current_steps": 1870, "total_steps": 1875, "loss": 0.2778, "lr": 1.7545860759693445e-09, "epoch": 2.992, "percentage": 99.73, "elapsed_time": "4:23:45", "remaining_time": "0:00:42"}
|
188 |
+
{"current_steps": 1875, "total_steps": 1875, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "4:24:37", "remaining_time": "0:00:00"}
|