Training in progress, epoch 3
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4976698672
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ec89692a818ad439916e22c1eff80e73d815962c5a3e3e8037c000021c3fe804
|
3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999802720
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3e9f951e5e74f68af24346bf8596298573129bbd76ff8483159a022eab81a276
|
3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4915916176
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e2afed67938a4ce85df8163657d48ca549d23c811372484b6369c9044286ef05
|
3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1168138808
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ee1a3f51edb5a10ed40b50da52f0743de34cb10f236739b907f4e67fbc4016f8
|
3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
@@ -79,3 +79,41 @@
|
|
79 |
{"current_steps": 770, "total_steps": 1152, "loss": 0.2117, "learning_rate": 5e-06, "epoch": 2.0052083333333335, "percentage": 66.84, "elapsed_time": "1:19:19", "remaining_time": "0:39:21"}
|
80 |
{"current_steps": 780, "total_steps": 1152, "loss": 0.1945, "learning_rate": 5e-06, "epoch": 2.03125, "percentage": 67.71, "elapsed_time": "1:20:18", "remaining_time": "0:38:17"}
|
81 |
{"current_steps": 790, "total_steps": 1152, "loss": 0.1941, "learning_rate": 5e-06, "epoch": 2.0572916666666665, "percentage": 68.58, "elapsed_time": "1:21:16", "remaining_time": "0:37:14"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
79 |
{"current_steps": 770, "total_steps": 1152, "loss": 0.2117, "learning_rate": 5e-06, "epoch": 2.0052083333333335, "percentage": 66.84, "elapsed_time": "1:19:19", "remaining_time": "0:39:21"}
|
80 |
{"current_steps": 780, "total_steps": 1152, "loss": 0.1945, "learning_rate": 5e-06, "epoch": 2.03125, "percentage": 67.71, "elapsed_time": "1:20:18", "remaining_time": "0:38:17"}
|
81 |
{"current_steps": 790, "total_steps": 1152, "loss": 0.1941, "learning_rate": 5e-06, "epoch": 2.0572916666666665, "percentage": 68.58, "elapsed_time": "1:21:16", "remaining_time": "0:37:14"}
|
82 |
+
{"current_steps": 800, "total_steps": 1152, "loss": 0.1957, "learning_rate": 5e-06, "epoch": 2.0833333333333335, "percentage": 69.44, "elapsed_time": "1:22:14", "remaining_time": "0:36:11"}
|
83 |
+
{"current_steps": 810, "total_steps": 1152, "loss": 0.1955, "learning_rate": 5e-06, "epoch": 2.109375, "percentage": 70.31, "elapsed_time": "1:23:12", "remaining_time": "0:35:08"}
|
84 |
+
{"current_steps": 820, "total_steps": 1152, "loss": 0.1918, "learning_rate": 5e-06, "epoch": 2.1354166666666665, "percentage": 71.18, "elapsed_time": "1:24:11", "remaining_time": "0:34:05"}
|
85 |
+
{"current_steps": 830, "total_steps": 1152, "loss": 0.1938, "learning_rate": 5e-06, "epoch": 2.1614583333333335, "percentage": 72.05, "elapsed_time": "1:25:09", "remaining_time": "0:33:02"}
|
86 |
+
{"current_steps": 840, "total_steps": 1152, "loss": 0.1951, "learning_rate": 5e-06, "epoch": 2.1875, "percentage": 72.92, "elapsed_time": "1:26:07", "remaining_time": "0:31:59"}
|
87 |
+
{"current_steps": 850, "total_steps": 1152, "loss": 0.1967, "learning_rate": 5e-06, "epoch": 2.2135416666666665, "percentage": 73.78, "elapsed_time": "1:27:05", "remaining_time": "0:30:56"}
|
88 |
+
{"current_steps": 860, "total_steps": 1152, "loss": 0.1941, "learning_rate": 5e-06, "epoch": 2.2395833333333335, "percentage": 74.65, "elapsed_time": "1:28:03", "remaining_time": "0:29:54"}
|
89 |
+
{"current_steps": 870, "total_steps": 1152, "loss": 0.1949, "learning_rate": 5e-06, "epoch": 2.265625, "percentage": 75.52, "elapsed_time": "1:29:02", "remaining_time": "0:28:51"}
|
90 |
+
{"current_steps": 880, "total_steps": 1152, "loss": 0.1964, "learning_rate": 5e-06, "epoch": 2.2916666666666665, "percentage": 76.39, "elapsed_time": "1:30:00", "remaining_time": "0:27:49"}
|
91 |
+
{"current_steps": 890, "total_steps": 1152, "loss": 0.1959, "learning_rate": 5e-06, "epoch": 2.3177083333333335, "percentage": 77.26, "elapsed_time": "1:30:58", "remaining_time": "0:26:46"}
|
92 |
+
{"current_steps": 900, "total_steps": 1152, "loss": 0.1929, "learning_rate": 5e-06, "epoch": 2.34375, "percentage": 78.12, "elapsed_time": "1:31:56", "remaining_time": "0:25:44"}
|
93 |
+
{"current_steps": 910, "total_steps": 1152, "loss": 0.193, "learning_rate": 5e-06, "epoch": 2.3697916666666665, "percentage": 78.99, "elapsed_time": "1:32:54", "remaining_time": "0:24:42"}
|
94 |
+
{"current_steps": 920, "total_steps": 1152, "loss": 0.1961, "learning_rate": 5e-06, "epoch": 2.3958333333333335, "percentage": 79.86, "elapsed_time": "1:33:53", "remaining_time": "0:23:40"}
|
95 |
+
{"current_steps": 930, "total_steps": 1152, "loss": 0.1955, "learning_rate": 5e-06, "epoch": 2.421875, "percentage": 80.73, "elapsed_time": "1:34:51", "remaining_time": "0:22:38"}
|
96 |
+
{"current_steps": 940, "total_steps": 1152, "loss": 0.1971, "learning_rate": 5e-06, "epoch": 2.4479166666666665, "percentage": 81.6, "elapsed_time": "1:35:49", "remaining_time": "0:21:36"}
|
97 |
+
{"current_steps": 950, "total_steps": 1152, "loss": 0.1942, "learning_rate": 5e-06, "epoch": 2.4739583333333335, "percentage": 82.47, "elapsed_time": "1:36:48", "remaining_time": "0:20:34"}
|
98 |
+
{"current_steps": 960, "total_steps": 1152, "loss": 0.1949, "learning_rate": 5e-06, "epoch": 2.5, "percentage": 83.33, "elapsed_time": "1:37:46", "remaining_time": "0:19:33"}
|
99 |
+
{"current_steps": 970, "total_steps": 1152, "loss": 0.1941, "learning_rate": 5e-06, "epoch": 2.5260416666666665, "percentage": 84.2, "elapsed_time": "1:38:44", "remaining_time": "0:18:31"}
|
100 |
+
{"current_steps": 980, "total_steps": 1152, "loss": 0.1935, "learning_rate": 5e-06, "epoch": 2.5520833333333335, "percentage": 85.07, "elapsed_time": "1:39:42", "remaining_time": "0:17:30"}
|
101 |
+
{"current_steps": 990, "total_steps": 1152, "loss": 0.1936, "learning_rate": 5e-06, "epoch": 2.578125, "percentage": 85.94, "elapsed_time": "1:40:40", "remaining_time": "0:16:28"}
|
102 |
+
{"current_steps": 1000, "total_steps": 1152, "loss": 0.1931, "learning_rate": 5e-06, "epoch": 2.6041666666666665, "percentage": 86.81, "elapsed_time": "1:41:39", "remaining_time": "0:15:27"}
|
103 |
+
{"current_steps": 1010, "total_steps": 1152, "loss": 0.1942, "learning_rate": 5e-06, "epoch": 2.6302083333333335, "percentage": 87.67, "elapsed_time": "1:42:37", "remaining_time": "0:14:25"}
|
104 |
+
{"current_steps": 1020, "total_steps": 1152, "loss": 0.1913, "learning_rate": 5e-06, "epoch": 2.65625, "percentage": 88.54, "elapsed_time": "1:43:35", "remaining_time": "0:13:24"}
|
105 |
+
{"current_steps": 1030, "total_steps": 1152, "loss": 0.1925, "learning_rate": 5e-06, "epoch": 2.6822916666666665, "percentage": 89.41, "elapsed_time": "1:44:34", "remaining_time": "0:12:23"}
|
106 |
+
{"current_steps": 1040, "total_steps": 1152, "loss": 0.1953, "learning_rate": 5e-06, "epoch": 2.7083333333333335, "percentage": 90.28, "elapsed_time": "1:45:32", "remaining_time": "0:11:21"}
|
107 |
+
{"current_steps": 1050, "total_steps": 1152, "loss": 0.192, "learning_rate": 5e-06, "epoch": 2.734375, "percentage": 91.15, "elapsed_time": "1:46:30", "remaining_time": "0:10:20"}
|
108 |
+
{"current_steps": 1060, "total_steps": 1152, "loss": 0.1958, "learning_rate": 5e-06, "epoch": 2.7604166666666665, "percentage": 92.01, "elapsed_time": "1:47:28", "remaining_time": "0:09:19"}
|
109 |
+
{"current_steps": 1070, "total_steps": 1152, "loss": 0.1921, "learning_rate": 5e-06, "epoch": 2.7864583333333335, "percentage": 92.88, "elapsed_time": "1:48:26", "remaining_time": "0:08:18"}
|
110 |
+
{"current_steps": 1080, "total_steps": 1152, "loss": 0.1926, "learning_rate": 5e-06, "epoch": 2.8125, "percentage": 93.75, "elapsed_time": "1:49:24", "remaining_time": "0:07:17"}
|
111 |
+
{"current_steps": 1090, "total_steps": 1152, "loss": 0.1953, "learning_rate": 5e-06, "epoch": 2.8385416666666665, "percentage": 94.62, "elapsed_time": "1:50:23", "remaining_time": "0:06:16"}
|
112 |
+
{"current_steps": 1100, "total_steps": 1152, "loss": 0.1951, "learning_rate": 5e-06, "epoch": 2.8645833333333335, "percentage": 95.49, "elapsed_time": "1:51:21", "remaining_time": "0:05:15"}
|
113 |
+
{"current_steps": 1110, "total_steps": 1152, "loss": 0.1901, "learning_rate": 5e-06, "epoch": 2.890625, "percentage": 96.35, "elapsed_time": "1:52:19", "remaining_time": "0:04:15"}
|
114 |
+
{"current_steps": 1120, "total_steps": 1152, "loss": 0.194, "learning_rate": 5e-06, "epoch": 2.9166666666666665, "percentage": 97.22, "elapsed_time": "1:53:17", "remaining_time": "0:03:14"}
|
115 |
+
{"current_steps": 1130, "total_steps": 1152, "loss": 0.1933, "learning_rate": 5e-06, "epoch": 2.9427083333333335, "percentage": 98.09, "elapsed_time": "1:54:16", "remaining_time": "0:02:13"}
|
116 |
+
{"current_steps": 1140, "total_steps": 1152, "loss": 0.1902, "learning_rate": 5e-06, "epoch": 2.96875, "percentage": 98.96, "elapsed_time": "1:55:14", "remaining_time": "0:01:12"}
|
117 |
+
{"current_steps": 1150, "total_steps": 1152, "loss": 0.1929, "learning_rate": 5e-06, "epoch": 2.9947916666666665, "percentage": 99.83, "elapsed_time": "1:56:12", "remaining_time": "0:00:12"}
|
118 |
+
{"current_steps": 1152, "total_steps": 1152, "eval_loss": 0.22828711569309235, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "1:58:41", "remaining_time": "0:00:00"}
|
119 |
+
{"current_steps": 1152, "total_steps": 1152, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "2:00:26", "remaining_time": "0:00:00"}
|