Training in progress, epoch 3
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4976698672
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:abc28d26f1d3cd9da19a5020c3d09c6e1a7d2010d2a921fd6fd0cc5c7005fde3
|
3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999802720
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:38f408f7003878dc219f716828a8a3df6dedf96150541491006c8fa1f26e77a8
|
3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4915916176
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:10ca496697764c0eb732355ef7cf7d6bdcb303e1b4d793a8ba9506752fd58c71
|
3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1168138808
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:30daaa75319dce6896fe520e8ddf974003a7d1229ff778a85590404be8ef2202
|
3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
@@ -80,3 +80,42 @@
|
|
80 |
{"current_steps": 782, "total_steps": 1173, "eval_loss": 0.6335848569869995, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "1:19:47", "remaining_time": "0:39:53"}
|
81 |
{"current_steps": 790, "total_steps": 1173, "loss": 0.5672, "learning_rate": 5e-06, "epoch": 2.020460358056266, "percentage": 67.35, "elapsed_time": "1:22:06", "remaining_time": "0:39:48"}
|
82 |
{"current_steps": 800, "total_steps": 1173, "loss": 0.5592, "learning_rate": 5e-06, "epoch": 2.0460358056265986, "percentage": 68.2, "elapsed_time": "1:23:05", "remaining_time": "0:38:44"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
80 |
{"current_steps": 782, "total_steps": 1173, "eval_loss": 0.6335848569869995, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "1:19:47", "remaining_time": "0:39:53"}
|
81 |
{"current_steps": 790, "total_steps": 1173, "loss": 0.5672, "learning_rate": 5e-06, "epoch": 2.020460358056266, "percentage": 67.35, "elapsed_time": "1:22:06", "remaining_time": "0:39:48"}
|
82 |
{"current_steps": 800, "total_steps": 1173, "loss": 0.5592, "learning_rate": 5e-06, "epoch": 2.0460358056265986, "percentage": 68.2, "elapsed_time": "1:23:05", "remaining_time": "0:38:44"}
|
83 |
+
{"current_steps": 810, "total_steps": 1173, "loss": 0.5431, "learning_rate": 5e-06, "epoch": 2.071611253196931, "percentage": 69.05, "elapsed_time": "1:24:04", "remaining_time": "0:37:40"}
|
84 |
+
{"current_steps": 820, "total_steps": 1173, "loss": 0.5558, "learning_rate": 5e-06, "epoch": 2.0971867007672635, "percentage": 69.91, "elapsed_time": "1:25:03", "remaining_time": "0:36:36"}
|
85 |
+
{"current_steps": 830, "total_steps": 1173, "loss": 0.549, "learning_rate": 5e-06, "epoch": 2.122762148337596, "percentage": 70.76, "elapsed_time": "1:26:01", "remaining_time": "0:35:33"}
|
86 |
+
{"current_steps": 840, "total_steps": 1173, "loss": 0.5595, "learning_rate": 5e-06, "epoch": 2.1483375959079285, "percentage": 71.61, "elapsed_time": "1:27:00", "remaining_time": "0:34:29"}
|
87 |
+
{"current_steps": 850, "total_steps": 1173, "loss": 0.5584, "learning_rate": 5e-06, "epoch": 2.1739130434782608, "percentage": 72.46, "elapsed_time": "1:27:58", "remaining_time": "0:33:25"}
|
88 |
+
{"current_steps": 860, "total_steps": 1173, "loss": 0.5556, "learning_rate": 5e-06, "epoch": 2.1994884910485935, "percentage": 73.32, "elapsed_time": "1:28:56", "remaining_time": "0:32:22"}
|
89 |
+
{"current_steps": 870, "total_steps": 1173, "loss": 0.5595, "learning_rate": 5e-06, "epoch": 2.2250639386189257, "percentage": 74.17, "elapsed_time": "1:29:55", "remaining_time": "0:31:19"}
|
90 |
+
{"current_steps": 880, "total_steps": 1173, "loss": 0.5541, "learning_rate": 5e-06, "epoch": 2.2506393861892584, "percentage": 75.02, "elapsed_time": "1:30:55", "remaining_time": "0:30:16"}
|
91 |
+
{"current_steps": 890, "total_steps": 1173, "loss": 0.5597, "learning_rate": 5e-06, "epoch": 2.2762148337595907, "percentage": 75.87, "elapsed_time": "1:31:53", "remaining_time": "0:29:13"}
|
92 |
+
{"current_steps": 900, "total_steps": 1173, "loss": 0.5585, "learning_rate": 5e-06, "epoch": 2.3017902813299234, "percentage": 76.73, "elapsed_time": "1:32:52", "remaining_time": "0:28:10"}
|
93 |
+
{"current_steps": 910, "total_steps": 1173, "loss": 0.553, "learning_rate": 5e-06, "epoch": 2.3273657289002556, "percentage": 77.58, "elapsed_time": "1:33:51", "remaining_time": "0:27:07"}
|
94 |
+
{"current_steps": 920, "total_steps": 1173, "loss": 0.5555, "learning_rate": 5e-06, "epoch": 2.3529411764705883, "percentage": 78.43, "elapsed_time": "1:34:50", "remaining_time": "0:26:04"}
|
95 |
+
{"current_steps": 930, "total_steps": 1173, "loss": 0.5539, "learning_rate": 5e-06, "epoch": 2.3785166240409206, "percentage": 79.28, "elapsed_time": "1:35:48", "remaining_time": "0:25:02"}
|
96 |
+
{"current_steps": 940, "total_steps": 1173, "loss": 0.5596, "learning_rate": 5e-06, "epoch": 2.4040920716112533, "percentage": 80.14, "elapsed_time": "1:36:46", "remaining_time": "0:23:59"}
|
97 |
+
{"current_steps": 950, "total_steps": 1173, "loss": 0.5575, "learning_rate": 5e-06, "epoch": 2.4296675191815855, "percentage": 80.99, "elapsed_time": "1:37:45", "remaining_time": "0:22:56"}
|
98 |
+
{"current_steps": 960, "total_steps": 1173, "loss": 0.562, "learning_rate": 5e-06, "epoch": 2.455242966751918, "percentage": 81.84, "elapsed_time": "1:38:43", "remaining_time": "0:21:54"}
|
99 |
+
{"current_steps": 970, "total_steps": 1173, "loss": 0.5555, "learning_rate": 5e-06, "epoch": 2.4808184143222505, "percentage": 82.69, "elapsed_time": "1:39:42", "remaining_time": "0:20:51"}
|
100 |
+
{"current_steps": 980, "total_steps": 1173, "loss": 0.5586, "learning_rate": 5e-06, "epoch": 2.506393861892583, "percentage": 83.55, "elapsed_time": "1:40:41", "remaining_time": "0:19:49"}
|
101 |
+
{"current_steps": 990, "total_steps": 1173, "loss": 0.5573, "learning_rate": 5e-06, "epoch": 2.531969309462916, "percentage": 84.4, "elapsed_time": "1:41:39", "remaining_time": "0:18:47"}
|
102 |
+
{"current_steps": 1000, "total_steps": 1173, "loss": 0.559, "learning_rate": 5e-06, "epoch": 2.557544757033248, "percentage": 85.25, "elapsed_time": "1:42:39", "remaining_time": "0:17:45"}
|
103 |
+
{"current_steps": 1010, "total_steps": 1173, "loss": 0.5663, "learning_rate": 5e-06, "epoch": 2.5831202046035804, "percentage": 86.1, "elapsed_time": "1:43:38", "remaining_time": "0:16:43"}
|
104 |
+
{"current_steps": 1020, "total_steps": 1173, "loss": 0.5639, "learning_rate": 5e-06, "epoch": 2.608695652173913, "percentage": 86.96, "elapsed_time": "1:44:37", "remaining_time": "0:15:41"}
|
105 |
+
{"current_steps": 1030, "total_steps": 1173, "loss": 0.5605, "learning_rate": 5e-06, "epoch": 2.634271099744246, "percentage": 87.81, "elapsed_time": "1:45:36", "remaining_time": "0:14:39"}
|
106 |
+
{"current_steps": 1040, "total_steps": 1173, "loss": 0.5629, "learning_rate": 5e-06, "epoch": 2.659846547314578, "percentage": 88.66, "elapsed_time": "1:46:36", "remaining_time": "0:13:37"}
|
107 |
+
{"current_steps": 1050, "total_steps": 1173, "loss": 0.5559, "learning_rate": 5e-06, "epoch": 2.6854219948849103, "percentage": 89.51, "elapsed_time": "1:47:35", "remaining_time": "0:12:36"}
|
108 |
+
{"current_steps": 1060, "total_steps": 1173, "loss": 0.5602, "learning_rate": 5e-06, "epoch": 2.710997442455243, "percentage": 90.37, "elapsed_time": "1:48:34", "remaining_time": "0:11:34"}
|
109 |
+
{"current_steps": 1070, "total_steps": 1173, "loss": 0.5647, "learning_rate": 5e-06, "epoch": 2.7365728900255757, "percentage": 91.22, "elapsed_time": "1:49:33", "remaining_time": "0:10:32"}
|
110 |
+
{"current_steps": 1080, "total_steps": 1173, "loss": 0.5561, "learning_rate": 5e-06, "epoch": 2.762148337595908, "percentage": 92.07, "elapsed_time": "1:50:32", "remaining_time": "0:09:31"}
|
111 |
+
{"current_steps": 1090, "total_steps": 1173, "loss": 0.5536, "learning_rate": 5e-06, "epoch": 2.78772378516624, "percentage": 92.92, "elapsed_time": "1:51:31", "remaining_time": "0:08:29"}
|
112 |
+
{"current_steps": 1100, "total_steps": 1173, "loss": 0.5579, "learning_rate": 5e-06, "epoch": 2.813299232736573, "percentage": 93.78, "elapsed_time": "1:52:29", "remaining_time": "0:07:27"}
|
113 |
+
{"current_steps": 1110, "total_steps": 1173, "loss": 0.5629, "learning_rate": 5e-06, "epoch": 2.8388746803069056, "percentage": 94.63, "elapsed_time": "1:53:27", "remaining_time": "0:06:26"}
|
114 |
+
{"current_steps": 1120, "total_steps": 1173, "loss": 0.5662, "learning_rate": 5e-06, "epoch": 2.864450127877238, "percentage": 95.48, "elapsed_time": "1:54:26", "remaining_time": "0:05:24"}
|
115 |
+
{"current_steps": 1130, "total_steps": 1173, "loss": 0.5622, "learning_rate": 5e-06, "epoch": 2.89002557544757, "percentage": 96.33, "elapsed_time": "1:55:24", "remaining_time": "0:04:23"}
|
116 |
+
{"current_steps": 1140, "total_steps": 1173, "loss": 0.5613, "learning_rate": 5e-06, "epoch": 2.915601023017903, "percentage": 97.19, "elapsed_time": "1:56:23", "remaining_time": "0:03:22"}
|
117 |
+
{"current_steps": 1150, "total_steps": 1173, "loss": 0.5634, "learning_rate": 5e-06, "epoch": 2.9411764705882355, "percentage": 98.04, "elapsed_time": "1:57:21", "remaining_time": "0:02:20"}
|
118 |
+
{"current_steps": 1160, "total_steps": 1173, "loss": 0.5549, "learning_rate": 5e-06, "epoch": 2.9667519181585678, "percentage": 98.89, "elapsed_time": "1:58:21", "remaining_time": "0:01:19"}
|
119 |
+
{"current_steps": 1170, "total_steps": 1173, "loss": 0.5549, "learning_rate": 5e-06, "epoch": 2.9923273657289, "percentage": 99.74, "elapsed_time": "1:59:20", "remaining_time": "0:00:18"}
|
120 |
+
{"current_steps": 1173, "total_steps": 1173, "eval_loss": 0.6347914934158325, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "2:01:49", "remaining_time": "0:00:00"}
|
121 |
+
{"current_steps": 1173, "total_steps": 1173, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "2:03:18", "remaining_time": "0:00:00"}
|