sedrickkeh
commited on
Commit
•
6609b17
1
Parent(s):
0688a31
Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4976698672
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:97d519403421af1f66fefdc27809f73eb1363a8801f6eadb3317f39ca0732c34
|
3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999802720
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:98ad3fe8d4951738eec1dcd052a7abde56a2bb49592faceba0543499916e949c
|
3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4915916176
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3fea98f5ad28cd40e8a4427946849a7ff176794f9519691f8118676d3a019649
|
3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1168138808
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8a0a3716776c48d768b3742688d0b069334428102b4bdff4f39e484530b89e54
|
3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
@@ -108,3 +108,56 @@
|
|
108 |
{"current_steps": 1070, "total_steps": 1617, "loss": 0.519, "lr": 5e-06, "epoch": 1.9846974263853467, "percentage": 66.17, "elapsed_time": "17:13:16", "remaining_time": "8:48:13"}
|
109 |
{"current_steps": 1078, "total_steps": 1617, "eval_loss": 0.5572099685668945, "epoch": 1.9995362856480408, "percentage": 66.67, "elapsed_time": "17:30:39", "remaining_time": "8:45:19"}
|
110 |
{"current_steps": 1080, "total_steps": 1617, "loss": 0.5612, "lr": 5e-06, "epoch": 2.0032460004637143, "percentage": 66.79, "elapsed_time": "17:33:34", "remaining_time": "8:43:51"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
108 |
{"current_steps": 1070, "total_steps": 1617, "loss": 0.519, "lr": 5e-06, "epoch": 1.9846974263853467, "percentage": 66.17, "elapsed_time": "17:13:16", "remaining_time": "8:48:13"}
|
109 |
{"current_steps": 1078, "total_steps": 1617, "eval_loss": 0.5572099685668945, "epoch": 1.9995362856480408, "percentage": 66.67, "elapsed_time": "17:30:39", "remaining_time": "8:45:19"}
|
110 |
{"current_steps": 1080, "total_steps": 1617, "loss": 0.5612, "lr": 5e-06, "epoch": 2.0032460004637143, "percentage": 66.79, "elapsed_time": "17:33:34", "remaining_time": "8:43:51"}
|
111 |
+
{"current_steps": 1090, "total_steps": 1617, "loss": 0.4796, "lr": 5e-06, "epoch": 2.0217945745420822, "percentage": 67.41, "elapsed_time": "17:43:09", "remaining_time": "8:34:01"}
|
112 |
+
{"current_steps": 1100, "total_steps": 1617, "loss": 0.4717, "lr": 5e-06, "epoch": 2.0403431486204497, "percentage": 68.03, "elapsed_time": "17:52:43", "remaining_time": "8:24:10"}
|
113 |
+
{"current_steps": 1110, "total_steps": 1617, "loss": 0.4705, "lr": 5e-06, "epoch": 2.0588917226988177, "percentage": 68.65, "elapsed_time": "18:02:17", "remaining_time": "8:14:20"}
|
114 |
+
{"current_steps": 1120, "total_steps": 1617, "loss": 0.4661, "lr": 5e-06, "epoch": 2.0774402967771852, "percentage": 69.26, "elapsed_time": "18:11:51", "remaining_time": "8:04:30"}
|
115 |
+
{"current_steps": 1130, "total_steps": 1617, "loss": 0.4674, "lr": 5e-06, "epoch": 2.095988870855553, "percentage": 69.88, "elapsed_time": "18:21:25", "remaining_time": "7:54:41"}
|
116 |
+
{"current_steps": 1140, "total_steps": 1617, "loss": 0.4645, "lr": 5e-06, "epoch": 2.1145374449339207, "percentage": 70.5, "elapsed_time": "18:30:59", "remaining_time": "7:44:51"}
|
117 |
+
{"current_steps": 1150, "total_steps": 1617, "loss": 0.4676, "lr": 5e-06, "epoch": 2.1330860190122882, "percentage": 71.12, "elapsed_time": "18:40:33", "remaining_time": "7:35:02"}
|
118 |
+
{"current_steps": 1160, "total_steps": 1617, "loss": 0.4657, "lr": 5e-06, "epoch": 2.151634593090656, "percentage": 71.74, "elapsed_time": "18:50:07", "remaining_time": "7:25:13"}
|
119 |
+
{"current_steps": 1170, "total_steps": 1617, "loss": 0.4656, "lr": 5e-06, "epoch": 2.1701831671690237, "percentage": 72.36, "elapsed_time": "18:59:40", "remaining_time": "7:15:24"}
|
120 |
+
{"current_steps": 1180, "total_steps": 1617, "loss": 0.4583, "lr": 5e-06, "epoch": 2.1887317412473917, "percentage": 72.97, "elapsed_time": "19:09:14", "remaining_time": "7:05:36"}
|
121 |
+
{"current_steps": 1190, "total_steps": 1617, "loss": 0.469, "lr": 5e-06, "epoch": 2.207280315325759, "percentage": 73.59, "elapsed_time": "19:18:47", "remaining_time": "6:55:48"}
|
122 |
+
{"current_steps": 1200, "total_steps": 1617, "loss": 0.4715, "lr": 5e-06, "epoch": 2.225828889404127, "percentage": 74.21, "elapsed_time": "19:28:21", "remaining_time": "6:46:00"}
|
123 |
+
{"current_steps": 1210, "total_steps": 1617, "loss": 0.4584, "lr": 5e-06, "epoch": 2.2443774634824947, "percentage": 74.83, "elapsed_time": "19:37:54", "remaining_time": "6:36:12"}
|
124 |
+
{"current_steps": 1220, "total_steps": 1617, "loss": 0.4772, "lr": 5e-06, "epoch": 2.2629260375608626, "percentage": 75.45, "elapsed_time": "19:47:28", "remaining_time": "6:26:24"}
|
125 |
+
{"current_steps": 1230, "total_steps": 1617, "loss": 0.4701, "lr": 5e-06, "epoch": 2.28147461163923, "percentage": 76.07, "elapsed_time": "19:57:01", "remaining_time": "6:16:37"}
|
126 |
+
{"current_steps": 1240, "total_steps": 1617, "loss": 0.4619, "lr": 5e-06, "epoch": 2.300023185717598, "percentage": 76.69, "elapsed_time": "20:06:35", "remaining_time": "6:06:50"}
|
127 |
+
{"current_steps": 1250, "total_steps": 1617, "loss": 0.4734, "lr": 5e-06, "epoch": 2.3185717597959656, "percentage": 77.3, "elapsed_time": "20:16:08", "remaining_time": "5:57:03"}
|
128 |
+
{"current_steps": 1260, "total_steps": 1617, "loss": 0.4746, "lr": 5e-06, "epoch": 2.3371203338743336, "percentage": 77.92, "elapsed_time": "20:25:43", "remaining_time": "5:47:17"}
|
129 |
+
{"current_steps": 1270, "total_steps": 1617, "loss": 0.4647, "lr": 5e-06, "epoch": 2.355668907952701, "percentage": 78.54, "elapsed_time": "20:35:16", "remaining_time": "5:37:30"}
|
130 |
+
{"current_steps": 1280, "total_steps": 1617, "loss": 0.459, "lr": 5e-06, "epoch": 2.374217482031069, "percentage": 79.16, "elapsed_time": "20:44:50", "remaining_time": "5:27:44"}
|
131 |
+
{"current_steps": 1290, "total_steps": 1617, "loss": 0.4687, "lr": 5e-06, "epoch": 2.3927660561094366, "percentage": 79.78, "elapsed_time": "20:54:24", "remaining_time": "5:17:58"}
|
132 |
+
{"current_steps": 1300, "total_steps": 1617, "loss": 0.4636, "lr": 5e-06, "epoch": 2.411314630187804, "percentage": 80.4, "elapsed_time": "21:03:58", "remaining_time": "5:08:12"}
|
133 |
+
{"current_steps": 1310, "total_steps": 1617, "loss": 0.4798, "lr": 5e-06, "epoch": 2.429863204266172, "percentage": 81.01, "elapsed_time": "21:13:32", "remaining_time": "4:58:27"}
|
134 |
+
{"current_steps": 1320, "total_steps": 1617, "loss": 0.4743, "lr": 5e-06, "epoch": 2.4484117783445396, "percentage": 81.63, "elapsed_time": "21:23:06", "remaining_time": "4:48:42"}
|
135 |
+
{"current_steps": 1330, "total_steps": 1617, "loss": 0.479, "lr": 5e-06, "epoch": 2.4669603524229076, "percentage": 82.25, "elapsed_time": "21:32:40", "remaining_time": "4:38:56"}
|
136 |
+
{"current_steps": 1340, "total_steps": 1617, "loss": 0.4667, "lr": 5e-06, "epoch": 2.485508926501275, "percentage": 82.87, "elapsed_time": "21:42:14", "remaining_time": "4:29:11"}
|
137 |
+
{"current_steps": 1350, "total_steps": 1617, "loss": 0.4756, "lr": 5e-06, "epoch": 2.504057500579643, "percentage": 83.49, "elapsed_time": "21:51:48", "remaining_time": "4:19:26"}
|
138 |
+
{"current_steps": 1360, "total_steps": 1617, "loss": 0.4656, "lr": 5e-06, "epoch": 2.5226060746580106, "percentage": 84.11, "elapsed_time": "22:01:22", "remaining_time": "4:09:42"}
|
139 |
+
{"current_steps": 1370, "total_steps": 1617, "loss": 0.4769, "lr": 5e-06, "epoch": 2.5411546487363785, "percentage": 84.72, "elapsed_time": "22:10:57", "remaining_time": "3:59:57"}
|
140 |
+
{"current_steps": 1380, "total_steps": 1617, "loss": 0.4715, "lr": 5e-06, "epoch": 2.559703222814746, "percentage": 85.34, "elapsed_time": "22:20:30", "remaining_time": "3:50:13"}
|
141 |
+
{"current_steps": 1390, "total_steps": 1617, "loss": 0.466, "lr": 5e-06, "epoch": 2.578251796893114, "percentage": 85.96, "elapsed_time": "22:30:05", "remaining_time": "3:40:28"}
|
142 |
+
{"current_steps": 1400, "total_steps": 1617, "loss": 0.4719, "lr": 5e-06, "epoch": 2.5968003709714815, "percentage": 86.58, "elapsed_time": "22:39:38", "remaining_time": "3:30:44"}
|
143 |
+
{"current_steps": 1410, "total_steps": 1617, "loss": 0.4657, "lr": 5e-06, "epoch": 2.615348945049849, "percentage": 87.2, "elapsed_time": "22:49:11", "remaining_time": "3:21:00"}
|
144 |
+
{"current_steps": 1420, "total_steps": 1617, "loss": 0.4649, "lr": 5e-06, "epoch": 2.633897519128217, "percentage": 87.82, "elapsed_time": "22:58:45", "remaining_time": "3:11:16"}
|
145 |
+
{"current_steps": 1430, "total_steps": 1617, "loss": 0.4734, "lr": 5e-06, "epoch": 2.652446093206585, "percentage": 88.44, "elapsed_time": "23:08:19", "remaining_time": "3:01:32"}
|
146 |
+
{"current_steps": 1440, "total_steps": 1617, "loss": 0.4696, "lr": 5e-06, "epoch": 2.6709946672849525, "percentage": 89.05, "elapsed_time": "23:17:52", "remaining_time": "2:51:49"}
|
147 |
+
{"current_steps": 1450, "total_steps": 1617, "loss": 0.4626, "lr": 5e-06, "epoch": 2.68954324136332, "percentage": 89.67, "elapsed_time": "23:27:26", "remaining_time": "2:42:05"}
|
148 |
+
{"current_steps": 1460, "total_steps": 1617, "loss": 0.4683, "lr": 5e-06, "epoch": 2.708091815441688, "percentage": 90.29, "elapsed_time": "23:36:59", "remaining_time": "2:32:22"}
|
149 |
+
{"current_steps": 1470, "total_steps": 1617, "loss": 0.4724, "lr": 5e-06, "epoch": 2.7266403895200555, "percentage": 90.91, "elapsed_time": "23:46:31", "remaining_time": "2:22:39"}
|
150 |
+
{"current_steps": 1480, "total_steps": 1617, "loss": 0.4756, "lr": 5e-06, "epoch": 2.7451889635984235, "percentage": 91.53, "elapsed_time": "23:56:05", "remaining_time": "2:12:56"}
|
151 |
+
{"current_steps": 1490, "total_steps": 1617, "loss": 0.4765, "lr": 5e-06, "epoch": 2.763737537676791, "percentage": 92.15, "elapsed_time": "1 day, 0:05:38", "remaining_time": "2:03:13"}
|
152 |
+
{"current_steps": 1500, "total_steps": 1617, "loss": 0.4798, "lr": 5e-06, "epoch": 2.782286111755159, "percentage": 92.76, "elapsed_time": "1 day, 0:15:11", "remaining_time": "1:53:30"}
|
153 |
+
{"current_steps": 1510, "total_steps": 1617, "loss": 0.4694, "lr": 5e-06, "epoch": 2.8008346858335265, "percentage": 93.38, "elapsed_time": "1 day, 0:24:45", "remaining_time": "1:43:47"}
|
154 |
+
{"current_steps": 1520, "total_steps": 1617, "loss": 0.4672, "lr": 5e-06, "epoch": 2.8193832599118944, "percentage": 94.0, "elapsed_time": "1 day, 0:34:18", "remaining_time": "1:34:05"}
|
155 |
+
{"current_steps": 1530, "total_steps": 1617, "loss": 0.4704, "lr": 5e-06, "epoch": 2.837931833990262, "percentage": 94.62, "elapsed_time": "1 day, 0:43:52", "remaining_time": "1:24:22"}
|
156 |
+
{"current_steps": 1540, "total_steps": 1617, "loss": 0.4795, "lr": 5e-06, "epoch": 2.85648040806863, "percentage": 95.24, "elapsed_time": "1 day, 0:53:25", "remaining_time": "1:14:40"}
|
157 |
+
{"current_steps": 1550, "total_steps": 1617, "loss": 0.4626, "lr": 5e-06, "epoch": 2.8750289821469974, "percentage": 95.86, "elapsed_time": "1 day, 1:02:59", "remaining_time": "1:04:58"}
|
158 |
+
{"current_steps": 1560, "total_steps": 1617, "loss": 0.4767, "lr": 5e-06, "epoch": 2.893577556225365, "percentage": 96.47, "elapsed_time": "1 day, 1:12:32", "remaining_time": "0:55:15"}
|
159 |
+
{"current_steps": 1570, "total_steps": 1617, "loss": 0.4681, "lr": 5e-06, "epoch": 2.912126130303733, "percentage": 97.09, "elapsed_time": "1 day, 1:22:05", "remaining_time": "0:45:33"}
|
160 |
+
{"current_steps": 1580, "total_steps": 1617, "loss": 0.4732, "lr": 5e-06, "epoch": 2.930674704382101, "percentage": 97.71, "elapsed_time": "1 day, 1:31:39", "remaining_time": "0:35:52"}
|
161 |
+
{"current_steps": 1590, "total_steps": 1617, "loss": 0.4732, "lr": 5e-06, "epoch": 2.9492232784604684, "percentage": 98.33, "elapsed_time": "1 day, 1:41:12", "remaining_time": "0:26:10"}
|
162 |
+
{"current_steps": 1600, "total_steps": 1617, "loss": 0.4713, "lr": 5e-06, "epoch": 2.967771852538836, "percentage": 98.95, "elapsed_time": "1 day, 1:50:45", "remaining_time": "0:16:28"}
|
163 |
+
{"current_steps": 1610, "total_steps": 1617, "loss": 0.469, "lr": 5e-06, "epoch": 2.986320426617204, "percentage": 99.57, "elapsed_time": "1 day, 2:00:19", "remaining_time": "0:06:47"}
|