aissatoubalde
commited on
Commit
•
fe490e0
1
Parent(s):
cc55646
Training in progress, epoch 0
Browse files- .ipynb_checkpoints/phi-2-custom-checkpoint.ipynb +0 -0
- adapter_config.json +6 -0
- fine-tuned-phi2.ipynb +9 -1002
- phi-2-custom.ipynb +0 -0
- training_args.bin +1 -1
.ipynb_checkpoints/phi-2-custom-checkpoint.ipynb
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
adapter_config.json
CHANGED
@@ -18,6 +18,12 @@
|
|
18 |
"r": 16,
|
19 |
"rank_pattern": {},
|
20 |
"revision": null,
|
|
|
|
|
|
|
|
|
|
|
|
|
21 |
"task_type": "CAUSAL_LM",
|
22 |
"use_rslora": false
|
23 |
}
|
|
|
18 |
"r": 16,
|
19 |
"rank_pattern": {},
|
20 |
"revision": null,
|
21 |
+
"target_modules": [
|
22 |
+
"fc2",
|
23 |
+
"fc1",
|
24 |
+
"v_proj",
|
25 |
+
"q_proj"
|
26 |
+
],
|
27 |
"task_type": "CAUSAL_LM",
|
28 |
"use_rslora": false
|
29 |
}
|
fine-tuned-phi2.ipynb
CHANGED
@@ -225,20 +225,10 @@
|
|
225 |
},
|
226 |
{
|
227 |
"cell_type": "code",
|
228 |
-
"execution_count":
|
229 |
"id": "75a61ec8-e440-42b0-8b4d-e3cb05841b71",
|
230 |
"metadata": {},
|
231 |
-
"outputs": [
|
232 |
-
{
|
233 |
-
"name": "stderr",
|
234 |
-
"output_type": "stream",
|
235 |
-
"text": [
|
236 |
-
"/usr/local/lib/python3.11/site-packages/tqdm/auto.py:21: TqdmWarning: IProgress not found. Please update jupyter and ipywidgets. See https://ipywidgets.readthedocs.io/en/stable/user_install.html\n",
|
237 |
-
" from .autonotebook import tqdm as notebook_tqdm\n",
|
238 |
-
"2024-02-15 17:38:51,139\tINFO util.py:154 -- Missing packages: ['ipywidgets']. Run `pip install -U ipywidgets`, then restart the notebook server for rich notebook output.\n"
|
239 |
-
]
|
240 |
-
}
|
241 |
-
],
|
242 |
"source": [
|
243 |
"import torch\n",
|
244 |
"import numpy as np\n",
|
@@ -250,31 +240,23 @@
|
|
250 |
},
|
251 |
{
|
252 |
"cell_type": "code",
|
253 |
-
"execution_count":
|
254 |
"id": "7d29ba48-d4b0-4f24-8f88-560d9bed100c",
|
255 |
"metadata": {
|
256 |
"scrolled": true
|
257 |
},
|
258 |
"outputs": [
|
259 |
-
{
|
260 |
-
"name": "stderr",
|
261 |
-
"output_type": "stream",
|
262 |
-
"text": [
|
263 |
-
"config.json: 100%|██████████| 897/897 [00:00<00:00, 6.40MB/s]"
|
264 |
-
]
|
265 |
-
},
|
266 |
{
|
267 |
"name": "stdout",
|
268 |
"output_type": "stream",
|
269 |
"text": [
|
270 |
-
"INFO 02-15
|
271 |
]
|
272 |
},
|
273 |
{
|
274 |
"name": "stderr",
|
275 |
"output_type": "stream",
|
276 |
"text": [
|
277 |
-
"\n",
|
278 |
"Special tokens have been added in the vocabulary, make sure the associated word embeddings are fine-tuned or trained.\n"
|
279 |
]
|
280 |
},
|
@@ -282,992 +264,17 @@
|
|
282 |
"name": "stdout",
|
283 |
"output_type": "stream",
|
284 |
"text": [
|
285 |
-
"INFO 02-15
|
286 |
-
]
|
287 |
-
},
|
288 |
-
{
|
289 |
-
"name": "stderr",
|
290 |
-
"output_type": "stream",
|
291 |
-
"text": [
|
292 |
-
"model-00003-of-00003.safetensors: 0%| | 0.00/1.15G [00:00<?, ?B/s]\n",
|
293 |
-
"model-00001-of-00003.safetensors: 0%| | 0.00/4.98G [00:00<?, ?B/s]\u001b[A\n",
|
294 |
-
"\n",
|
295 |
-
"model-00003-of-00003.safetensors: 2%|▏ | 21.0M/1.15G [00:00<00:13, 82.8MB/s]\n",
|
296 |
-
"model-00001-of-00003.safetensors: 0%| | 21.0M/4.98G [00:00<01:01, 80.2MB/s]\u001b[A\n",
|
297 |
-
"\n",
|
298 |
-
"model-00003-of-00003.safetensors: 4%|▎ | 41.9M/1.15G [00:00<00:09, 112MB/s] \u001b[A\u001b[A\n",
|
299 |
-
"\n",
|
300 |
-
"model-00002-of-00003.safetensors: 1%| | 31.5M/4.98G [00:00<00:56, 87.1MB/s]\u001b[A\u001b[A\n",
|
301 |
-
"model-00001-of-00003.safetensors: 1%| | 41.9M/4.98G [00:00<00:55, 89.8MB/s]\u001b[A\n",
|
302 |
-
"\n",
|
303 |
-
"model-00002-of-00003.safetensors: 1%| | 41.9M/4.98G [00:00<01:03, 78.0MB/s]\u001b[A\u001b[A\n",
|
304 |
-
"\n",
|
305 |
-
"model-00002-of-00003.safetensors: 1%| | 52.4M/4.98G [00:00<00:59, 82.3MB/s]\u001b[A\u001b[A\n",
|
306 |
-
"model-00001-of-00003.safetensors: 1%| | 52.4M/4.98G [00:00<01:24, 58.1MB/s]\u001b[A\n",
|
307 |
-
"\n",
|
308 |
-
"model-00002-of-00003.safetensors: 1%|▏ | 73.4M/4.98G [00:00<00:59, 82.0MB/s]\u001b[A\u001b[A\n",
|
309 |
-
"model-00001-of-00003.safetensors: 1%|▏ | 73.4M/4.98G [00:01<01:16, 64.0MB/s]\u001b[A\n",
|
310 |
-
"\n",
|
311 |
-
"model-00003-of-00003.safetensors: 5%|▌ | 62.9M/1.15G [00:01<00:25, 43.0MB/s]\u001b[A\u001b[A\n",
|
312 |
-
"model-00001-of-00003.safetensors: 2%|▏ | 83.9M/4.98G [00:01<01:22, 59.1MB/s]\u001b[A\n",
|
313 |
-
"\n",
|
314 |
-
"model-00003-of-00003.safetensors: 6%|▋ | 73.4M/1.15G [00:01<00:23, 46.8MB/s]\u001b[A\u001b[A\n",
|
315 |
-
"model-00001-of-00003.safetensors: 2%|▏ | 94.4M/4.98G [00:01<01:19, 61.3MB/s]\u001b[A\n",
|
316 |
-
"\n",
|
317 |
-
"model-00002-of-00003.safetensors: 2%|▏ | 115M/4.98G [00:01<01:00, 79.9MB/s]\u001b[A\u001b[A\n",
|
318 |
-
"model-00001-of-00003.safetensors: 2%|▏ | 105M/4.98G [00:01<01:21, 60.1MB/s] \u001b[A\n",
|
319 |
-
"\n",
|
320 |
-
"model-00002-of-00003.safetensors: 3%|▎ | 136M/4.98G [00:01<01:06, 72.9MB/s]\u001b[A\u001b[A\n",
|
321 |
-
"model-00003-of-00003.safetensors: 7%|▋ | 83.9M/1.15G [00:01<00:29, 35.7MB/s][A\n",
|
322 |
-
"\n",
|
323 |
-
"model-00002-of-00003.safetensors: 3%|▎ | 147M/4.98G [00:01<01:09, 69.6MB/s]\u001b[A\u001b[A\n",
|
324 |
-
"model-00001-of-00003.safetensors: 3%|▎ | 136M/4.98G [00:02<01:18, 61.6MB/s]\u001b[A\n",
|
325 |
-
"\n",
|
326 |
-
"model-00003-of-00003.safetensors: 8%|▊ | 94.4M/1.15G [00:02<00:35, 29.9MB/s][A\u001b[A\n",
|
327 |
-
"model-00003-of-00003.safetensors: 9%|▉ | 105M/1.15G [00:02<00:29, 35.8MB/s] [A\n",
|
328 |
-
"\n",
|
329 |
-
"model-00003-of-00003.safetensors: 10%|▉ | 115M/1.15G [00:02<00:25, 41.5MB/s]\u001b[A\u001b[A\n",
|
330 |
-
"model-00001-of-00003.safetensors: 3%|▎ | 168M/4.98G [00:02<01:18, 61.4MB/s]\u001b[A\n",
|
331 |
-
"\n",
|
332 |
-
"model-00002-of-00003.safetensors: 4%|▍ | 199M/4.98G [00:02<01:12, 65.8MB/s]\u001b[A\u001b[A\n",
|
333 |
-
"model-00001-of-00003.safetensors: 4%|▎ | 178M/4.98G [00:02<01:19, 60.5MB/s]\u001b[A\n",
|
334 |
-
"\n",
|
335 |
-
"model-00002-of-00003.safetensors: 4%|▍ | 210M/4.98G [00:02<01:09, 68.7MB/s]\u001b[A\u001b[A\n",
|
336 |
-
"model-00001-of-00003.safetensors: 4%|▍ | 199M/4.98G [00:03<01:11, 67.0MB/s]\u001b[A\n",
|
337 |
-
"\n",
|
338 |
-
"model-00002-of-00003.safetensors: 5%|▍ | 231M/4.98G [00:03<01:00, 78.9MB/s]\u001b[A\u001b[A\n",
|
339 |
-
"\n",
|
340 |
-
"model-00003-of-00003.safetensors: 12%|█▏ | 136M/1.15G [00:03<00:27, 37.0MB/s]\u001b[A\u001b[A\n",
|
341 |
-
"model-00003-of-00003.safetensors: 13%|█▎ | 147M/1.15G [00:03<00:26, 37.7MB/s]\u001b[A\n",
|
342 |
-
"model-00003-of-00003.safetensors: 15%|█▍ | 168M/1.15G [00:03<00:19, 51.6MB/s]\u001b[A\n",
|
343 |
-
"\n",
|
344 |
-
"model-00002-of-00003.safetensors: 5%|▌ | 262M/4.98G [00:03<01:26, 54.9MB/s]\u001b[A\u001b[A\n",
|
345 |
-
"model-00001-of-00003.safetensors: 5%|▍ | 231M/4.98G [00:03<01:41, 46.6MB/s]\u001b[A\n",
|
346 |
-
"\n",
|
347 |
-
"model-00002-of-00003.safetensors: 5%|▌ | 273M/4.98G [00:04<01:28, 53.1MB/s]\u001b[A\u001b[A\n",
|
348 |
-
"model-00003-of-00003.safetensors: 15%|█▌ | 178M/1.15G [00:04<00:24, 39.3MB/s]\u001b[A\n",
|
349 |
-
"\n",
|
350 |
-
"model-00002-of-00003.safetensors: 6%|▌ | 294M/4.98G [00:04<01:18, 59.7MB/s]\u001b[A\u001b[A\n",
|
351 |
-
"model-00003-of-00003.safetensors: 17%|█▋ | 199M/1.15G [00:04<00:18, 53.0MB/s]\u001b[A\n",
|
352 |
-
"\n",
|
353 |
-
"model-00002-of-00003.safetensors: 6%|▌ | 304M/4.98G [00:04<01:21, 57.5MB/s]\u001b[A\u001b[A\n",
|
354 |
-
"model-00003-of-00003.safetensors: 18%|█▊ | 210M/1.15G [00:04<00:22, 42.1MB/s]\u001b[A\n",
|
355 |
-
"\n",
|
356 |
-
"model-00003-of-00003.safetensors: 19%|█▉ | 220M/1.15G [00:05<00:19, 47.1MB/s]\u001b[A\u001b[A\n",
|
357 |
-
"\n",
|
358 |
-
"model-00002-of-00003.safetensors: 7%|▋ | 336M/4.98G [00:05<01:19, 58.4MB/s]\u001b[A\u001b[A\n",
|
359 |
-
"model-00001-of-00003.safetensors: 6%|▌ | 294M/4.98G [00:05<01:36, 48.7MB/s]\u001b[A\n",
|
360 |
-
"\n",
|
361 |
-
"model-00003-of-00003.safetensors: 21%|██ | 241M/1.15G [00:05<00:20, 43.7MB/s]\u001b[A\u001b[A\n",
|
362 |
-
"model-00001-of-00003.safetensors: 6%|▌ | 304M/4.98G [00:05<01:51, 42.0MB/s]\u001b[A\n",
|
363 |
-
"\n",
|
364 |
-
"model-00002-of-00003.safetensors: 7%|▋ | 357M/4.98G [00:05<01:32, 49.8MB/s]\u001b[A\u001b[A\n",
|
365 |
-
"model-00001-of-00003.safetensors: 6%|▋ | 315M/4.98G [00:05<01:42, 45.4MB/s]\u001b[A\n",
|
366 |
-
"\n",
|
367 |
-
"model-00003-of-00003.safetensors: 22%|██▏ | 252M/1.15G [00:05<00:21, 41.3MB/s]\u001b[A\u001b[A\n",
|
368 |
-
"\n",
|
369 |
-
"model-00003-of-00003.safetensors: 23%|██▎ | 262M/1.15G [00:05<00:18, 48.4MB/s]\u001b[A\u001b[A\n",
|
370 |
-
"\n",
|
371 |
-
"model-00002-of-00003.safetensors: 8%|▊ | 388M/4.98G [00:06<01:23, 55.1MB/s]\u001b[A\u001b[A\n",
|
372 |
-
"model-00003-of-00003.safetensors: 24%|██▎ | 273M/1.15G [00:06<00:18, 48.6MB/s]\u001b[A\n",
|
373 |
-
"model-00003-of-00003.safetensors: 25%|██▌ | 294M/1.15G [00:06<00:14, 61.2MB/s]\u001b[A\n",
|
374 |
-
"model-00001-of-00003.safetensors: 7%|▋ | 346M/4.98G [00:06<01:34, 48.9MB/s]\u001b[A\n",
|
375 |
-
"\n",
|
376 |
-
"model-00002-of-00003.safetensors: 8%|▊ | 409M/4.98G [00:06<01:17, 58.7MB/s]\u001b[A\u001b[A\n",
|
377 |
-
"\n",
|
378 |
-
"model-00002-of-00003.safetensors: 8%|▊ | 419M/4.98G [00:06<01:12, 63.3MB/s]\u001b[A\u001b[A\n",
|
379 |
-
"model-00003-of-00003.safetensors: 29%|██▉ | 336M/1.15G [00:06<00:09, 83.7MB/s]\u001b[A\n",
|
380 |
-
"\n",
|
381 |
-
"model-00002-of-00003.safetensors: 9%|▉ | 440M/4.98G [00:06<01:01, 73.6MB/s]\u001b[A\u001b[A\n",
|
382 |
-
"model-00001-of-00003.safetensors: 8%|▊ | 377M/4.98G [00:06<01:16, 60.6MB/s]\u001b[A\n",
|
383 |
-
"\n",
|
384 |
-
"model-00003-of-00003.safetensors: 30%|██▉ | 346M/1.15G [00:06<00:10, 76.1MB/s]\u001b[A\u001b[A\n",
|
385 |
-
"model-00001-of-00003.safetensors: 8%|▊ | 388M/4.98G [00:07<01:18, 58.2MB/s]\u001b[A\n",
|
386 |
-
"\n",
|
387 |
-
"model-00003-of-00003.safetensors: 31%|███ | 357M/1.15G [00:07<00:14, 53.4MB/s]\u001b[A\u001b[A\n",
|
388 |
-
"model-00001-of-00003.safetensors: 8%|▊ | 398M/4.98G [00:07<01:27, 52.6MB/s]\u001b[A\n",
|
389 |
-
"\n",
|
390 |
-
"model-00002-of-00003.safetensors: 10%|▉ | 482M/4.98G [00:07<01:14, 60.6MB/s]\u001b[A\u001b[A\n",
|
391 |
-
"model-00003-of-00003.safetensors: 33%|███▎ | 377M/1.15G [00:07<00:12, 62.3MB/s]\u001b[A\n",
|
392 |
-
"model-00001-of-00003.safetensors: 8%|▊ | 419M/4.98G [00:07<01:27, 52.4MB/s]\u001b[A\n",
|
393 |
-
"\n",
|
394 |
-
"model-00003-of-00003.safetensors: 34%|███▎ | 388M/1.15G [00:07<00:15, 50.9MB/s]\u001b[A\u001b[A\n",
|
395 |
-
"model-00001-of-00003.safetensors: 9%|▉ | 440M/4.98G [00:07<01:12, 62.9MB/s]\u001b[A\n",
|
396 |
-
"\n",
|
397 |
-
"model-00003-of-00003.safetensors: 35%|███▌ | 409M/1.15G [00:08<00:12, 57.7MB/s]\u001b[A\u001b[A\n",
|
398 |
-
"model-00003-of-00003.safetensors: 36%|███▋ | 419M/1.15G [00:08<00:12, 59.2MB/s]\u001b[A\n",
|
399 |
-
"\n",
|
400 |
-
"model-00002-of-00003.safetensors: 11%|█ | 535M/4.98G [00:08<01:21, 54.9MB/s]\u001b[A\u001b[A\n",
|
401 |
-
"model-00003-of-00003.safetensors: 38%|███▊ | 440M/1.15G [00:08<00:11, 64.5MB/s]\u001b[A\n",
|
402 |
-
"model-00001-of-00003.safetensors: 10%|▉ | 482M/4.98G [00:08<01:16, 59.0MB/s]\u001b[A\n",
|
403 |
-
"\n",
|
404 |
-
"model-00002-of-00003.safetensors: 11%|█ | 545M/4.98G [00:08<01:39, 44.6MB/s]\u001b[A\u001b[A\n",
|
405 |
-
"model-00003-of-00003.safetensors: 39%|███▉ | 451M/1.15G [00:09<00:14, 49.7MB/s]\u001b[A\n",
|
406 |
-
"\n",
|
407 |
-
"model-00003-of-00003.safetensors: 40%|███▉ | 461M/1.15G [00:09<00:12, 53.8MB/s]\u001b[A\u001b[A\n",
|
408 |
-
"model-00003-of-00003.safetensors: 41%|████ | 472M/1.15G [00:09<00:12, 56.4MB/s]\u001b[A\n",
|
409 |
-
"\n",
|
410 |
-
"model-00003-of-00003.safetensors: 42%|████▏ | 482M/1.15G [00:09<00:11, 56.5MB/s]\u001b[A\u001b[A\n",
|
411 |
-
"\n",
|
412 |
-
"model-00002-of-00003.safetensors: 12%|█▏ | 598M/4.98G [00:09<01:24, 52.2MB/s]\u001b[A\u001b[A\n",
|
413 |
-
"model-00003-of-00003.safetensors: 44%|████▎ | 503M/1.15G [00:09<00:09, 69.6MB/s]\u001b[A\n",
|
414 |
-
"\n",
|
415 |
-
"model-00002-of-00003.safetensors: 12%|█▏ | 608M/4.98G [00:09<01:24, 51.6MB/s]\u001b[A\u001b[A\n",
|
416 |
-
"model-00003-of-00003.safetensors: 45%|████▍ | 514M/1.15G [00:09<00:10, 59.1MB/s]\u001b[A\n",
|
417 |
-
"\n",
|
418 |
-
"model-00002-of-00003.safetensors: 12%|█▏ | 619M/4.98G [00:10<01:23, 52.1MB/s]\u001b[A\u001b[A\n",
|
419 |
-
"model-00003-of-00003.safetensors: 46%|████▋ | 535M/1.15G [00:10<00:08, 71.5MB/s]\u001b[A\n",
|
420 |
-
"\n",
|
421 |
-
"model-00002-of-00003.safetensors: 13%|█▎ | 629M/4.98G [00:10<01:18, 55.5MB/s]\u001b[A\u001b[A\n",
|
422 |
-
"\n",
|
423 |
-
"model-00003-of-00003.safetensors: 47%|████▋ | 545M/1.15G [00:10<00:09, 67.2MB/s]\u001b[A\u001b[A\n",
|
424 |
-
"model-00001-of-00003.safetensors: 11%|█▏ | 566M/4.98G [00:10<01:26, 51.3MB/s]\u001b[A\n",
|
425 |
-
"\n",
|
426 |
-
"model-00002-of-00003.safetensors: 13%|█▎ | 650M/4.98G [00:10<01:06, 65.6MB/s]\u001b[A\u001b[A\n",
|
427 |
-
"\n",
|
428 |
-
"model-00002-of-00003.safetensors: 13%|█▎ | 661M/4.98G [00:10<00:59, 72.8MB/s]\u001b[A\u001b[A\n",
|
429 |
-
"\n",
|
430 |
-
"model-00002-of-00003.safetensors: 14%|█▎ | 682M/4.98G [00:10<00:53, 81.0MB/s]\u001b[A\u001b[A\n",
|
431 |
-
"model-00003-of-00003.safetensors: 49%|████▉ | 566M/1.15G [00:11<00:12, 46.4MB/s]\u001b[A\n",
|
432 |
-
"\n",
|
433 |
-
"model-00002-of-00003.safetensors: 14%|█▍ | 692M/4.98G [00:11<01:10, 60.8MB/s]\u001b[A\u001b[A\n",
|
434 |
-
"model-00003-of-00003.safetensors: 52%|█████▏ | 598M/1.15G [00:11<00:09, 58.9MB/s]\u001b[A\n",
|
435 |
-
"model-00003-of-00003.safetensors: 53%|█████▎ | 608M/1.15G [00:11<00:09, 56.4MB/s]\u001b[A\n",
|
436 |
-
"\n",
|
437 |
-
"model-00002-of-00003.safetensors: 14%|█▍ | 703M/4.98G [00:11<01:57, 36.5MB/s]\u001b[A\u001b[A\n",
|
438 |
-
"model-00001-of-00003.safetensors: 13%|█▎ | 629M/4.98G [00:11<01:22, 52.9MB/s]\u001b[A\n",
|
439 |
-
"\n",
|
440 |
-
"model-00002-of-00003.safetensors: 15%|█▍ | 744M/4.98G [00:11<00:59, 70.6MB/s]\u001b[A\u001b[A\n",
|
441 |
-
"model-00003-of-00003.safetensors: 55%|█████▍ | 629M/1.15G [00:12<00:08, 59.7MB/s]\u001b[A\n",
|
442 |
-
"model-00001-of-00003.safetensors: 13%|█▎ | 650M/4.98G [00:12<01:11, 60.4MB/s]\u001b[A\n",
|
443 |
-
"\n",
|
444 |
-
"model-00003-of-00003.safetensors: 55%|█████▌ | 640M/1.15G [00:12<00:08, 62.1MB/s]\u001b[A\u001b[A\n",
|
445 |
-
"\n",
|
446 |
-
"model-00003-of-00003.safetensors: 56%|█████▋ | 650M/1.15G [00:12<00:08, 61.3MB/s]\u001b[A\u001b[A\n",
|
447 |
-
"model-00001-of-00003.safetensors: 13%|█▎ | 661M/4.98G [00:12<01:19, 54.3MB/s]\u001b[A\n",
|
448 |
-
"\n",
|
449 |
-
"model-00002-of-00003.safetensors: 16%|█▌ | 776M/4.98G [00:12<01:09, 60.9MB/s]\u001b[A\u001b[A\n",
|
450 |
-
"model-00003-of-00003.safetensors: 57%|█████▋ | 661M/1.15G [00:13<00:18, 26.1MB/s]\u001b[A\n",
|
451 |
-
"model-00001-of-00003.safetensors: 14%|█▍ | 692M/4.98G [00:13<02:04, 34.4MB/s]\u001b[A\n",
|
452 |
-
"\n",
|
453 |
-
"model-00003-of-00003.safetensors: 58%|█████▊ | 671M/1.15G [00:14<00:26, 18.4MB/s]\u001b[A\u001b[A\n",
|
454 |
-
"\n",
|
455 |
-
"model-00002-of-00003.safetensors: 16%|█▌ | 797M/4.98G [00:14<03:36, 19.4MB/s]\u001b[A\u001b[A\n",
|
456 |
-
"model-00003-of-00003.safetensors: 61%|██████ | 703M/1.15G [00:14<00:12, 36.5MB/s]\u001b[A\n",
|
457 |
-
"model-00001-of-00003.safetensors: 15%|█▌ | 755M/4.98G [00:14<01:21, 52.1MB/s]\u001b[A\n",
|
458 |
-
"\n",
|
459 |
-
"model-00003-of-00003.safetensors: 65%|██████▌ | 755M/1.15G [00:14<00:05, 74.6MB/s]\u001b[A\u001b[A\n",
|
460 |
-
"\n",
|
461 |
-
"model-00002-of-00003.safetensors: 18%|█▊ | 881M/4.98G [00:14<00:55, 74.5MB/s]\u001b[A\u001b[A\n",
|
462 |
-
"model-00003-of-00003.safetensors: 68%|██████▊ | 786M/1.15G [00:14<00:04, 87.3MB/s]\u001b[A\n",
|
463 |
-
"\n",
|
464 |
-
"model-00003-of-00003.safetensors: 70%|██████▉ | 807M/1.15G [00:15<00:03, 92.4MB/s]\u001b[A\u001b[A\n",
|
465 |
-
"\n",
|
466 |
-
"model-00002-of-00003.safetensors: 19%|█▊ | 923M/4.98G [00:15<00:53, 76.6MB/s]\u001b[A\u001b[A\n",
|
467 |
-
"model-00001-of-00003.safetensors: 16%|█▌ | 797M/4.98G [00:15<01:22, 50.6MB/s]\u001b[A\n",
|
468 |
-
"model-00001-of-00003.safetensors: 16%|█▋ | 818M/4.98G [00:15<01:26, 48.1MB/s]\u001b[A\n",
|
469 |
-
"model-00003-of-00003.safetensors: 72%|███████▏ | 828M/1.15G [00:16<00:07, 42.6MB/s]\u001b[A\n",
|
470 |
-
"\n",
|
471 |
-
"model-00003-of-00003.safetensors: 75%|███████▌ | 870M/1.15G [00:16<00:04, 67.9MB/s]\u001b[A\u001b[A\n",
|
472 |
-
"model-00003-of-00003.safetensors: 78%|███████▊ | 902M/1.15G [00:17<00:05, 43.1MB/s]\u001b[A\n",
|
473 |
-
"\n",
|
474 |
-
"model-00002-of-00003.safetensors: 20%|█▉ | 975M/4.98G [00:17<02:05, 32.0MB/s]\u001b[A\u001b[A\n",
|
475 |
-
"model-00001-of-00003.safetensors: 17%|█▋ | 849M/4.98G [00:17<03:05, 22.3MB/s]\u001b[A\n",
|
476 |
-
"\n",
|
477 |
-
"model-00003-of-00003.safetensors: 81%|████████ | 933M/1.15G [00:19<00:06, 36.5MB/s]]\u001b[A\u001b[A\n",
|
478 |
-
"model-00001-of-00003.safetensors: 17%|█▋ | 870M/4.98G [00:19<03:20, 20.5MB/s]\u001b[A\n",
|
479 |
-
"\n",
|
480 |
-
"model-00003-of-00003.safetensors: 85%|████████▍ | 975M/1.15G [00:19<00:03, 54.8MB/s]]\u001b[A\u001b[A\n",
|
481 |
-
"model-00001-of-00003.safetensors: 18%|█▊ | 912M/4.98G [00:19<01:40, 40.6MB/s]\u001b[A\n",
|
482 |
-
"\n",
|
483 |
-
"model-00002-of-00003.safetensors: 22%|██▏ | 1.08G/4.98G [00:19<01:04, 60.2MB/s]\u001b[A\u001b[A\n",
|
484 |
-
"\n",
|
485 |
-
"model-00002-of-00003.safetensors: 22%|██▏ | 1.11G/4.98G [00:19<00:50, 77.2MB/s]\u001b[A\u001b[A\n",
|
486 |
-
"model-00003-of-00003.safetensors: 93%|█████████▎| 1.07G/1.15G [00:20<00:01, 73.8MB/s][A\n",
|
487 |
-
"model-00003-of-00003.safetensors: 95%|█████████▍| 1.09G/1.15G [00:20<00:00, 72.8MB/s][A\n",
|
488 |
-
"\n",
|
489 |
-
"model-00002-of-00003.safetensors: 23%|██▎ | 1.14G/4.98G [00:20<01:20, 47.4MB/s]\u001b[A\u001b[A\n",
|
490 |
-
"model-00003-of-00003.safetensors: 96%|█████████▋| 1.11G/1.15G [00:20<00:00, 69.0MB/s][A\n",
|
491 |
-
"\n",
|
492 |
-
"model-00002-of-00003.safetensors: 24%|██▍ | 1.18G/4.98G [00:20<00:55, 68.9MB/s]\u001b[A\u001b[A\n",
|
493 |
-
"model-00001-of-00003.safetensors: 20%|█▉ | 996M/4.98G [00:20<01:19, 50.1MB/s]\u001b[A\n",
|
494 |
-
"\n",
|
495 |
-
"model-00003-of-00003.safetensors: 97%|█████████▋| 1.12G/1.15G [00:20<00:00, 68.7MB/s]\u001b[A\u001b[A\n",
|
496 |
-
"model-00001-of-00003.safetensors: 20%|██ | 1.02G/4.98G [00:20<01:10, 56.5MB/s]\u001b[A\n",
|
497 |
-
"\n",
|
498 |
-
"model-00002-of-00003.safetensors: 25%|██▌ | 1.25G/4.98G [00:21<00:42, 88.8MB/s]\u001b[A\u001b[A\n",
|
499 |
-
"model-00003-of-00003.safetensors: 99%|█████████▉| 1.14G/1.15G [00:21<00:00, 53.6MB/s]\u001b[A\n",
|
500 |
-
"\n",
|
501 |
-
"model-00003-of-00003.safetensors: 100%|██████████| 1.15G/1.15G [00:21<00:00, 53.4MB/s]\u001b[A\u001b[A\n",
|
502 |
-
"\n",
|
503 |
-
"model-00001-of-00003.safetensors: 21%|██ | 1.05G/4.98G [00:21<01:14, 52.8MB/s]\u001b[A\n",
|
504 |
-
"model-00001-of-00003.safetensors: 21%|██▏ | 1.06G/4.98G [00:21<01:23, 46.8MB/s]\u001b[A\n",
|
505 |
-
"\n",
|
506 |
-
"model-00002-of-00003.safetensors: 26%|██▌ | 1.29G/4.98G [00:22<01:06, 55.4MB/s]\u001b[A\u001b[A\n",
|
507 |
-
"model-00001-of-00003.safetensors: 22%|██▏ | 1.08G/4.98G [00:22<01:18, 49.6MB/s]\u001b[A\n",
|
508 |
-
"model-00001-of-00003.safetensors: 22%|██▏ | 1.09G/4.98G [00:22<01:15, 51.6MB/s]\u001b[A\n",
|
509 |
-
"\n",
|
510 |
-
"model-00002-of-00003.safetensors: 26%|██▋ | 1.31G/4.98G [00:22<01:05, 56.0MB/s]\u001b[A\u001b[A\n",
|
511 |
-
"model-00001-of-00003.safetensors: 22%|██▏ | 1.11G/4.98G [00:22<01:13, 52.7MB/s]\u001b[A\n",
|
512 |
-
"model-00001-of-00003.safetensors: 23%|██▎ | 1.12G/4.98G [00:23<01:25, 45.0MB/s]\u001b[A\n",
|
513 |
-
"\n",
|
514 |
-
"model-00002-of-00003.safetensors: 27%|██▋ | 1.32G/4.98G [00:23<01:31, 40.0MB/s]\u001b[A\u001b[A\n",
|
515 |
-
"model-00001-of-00003.safetensors: 23%|██▎ | 1.14G/4.98G [00:23<01:15, 50.8MB/s]\u001b[A\n",
|
516 |
-
"\n",
|
517 |
-
"model-00002-of-00003.safetensors: 27%|██▋ | 1.33G/4.98G [00:23<01:33, 39.1MB/s]\u001b[A\u001b[A\n",
|
518 |
-
"\n",
|
519 |
-
"model-00002-of-00003.safetensors: 27%|██▋ | 1.34G/4.98G [00:23<01:31, 39.9MB/s]\u001b[A\u001b[A\n",
|
520 |
-
"model-00001-of-00003.safetensors: 23%|██▎ | 1.15G/4.98G [00:23<01:24, 45.5MB/s]\u001b[A\n",
|
521 |
-
"\n",
|
522 |
-
"model-00002-of-00003.safetensors: 27%|██▋ | 1.36G/4.98G [00:24<01:14, 48.4MB/s]\u001b[A\u001b[A\n",
|
523 |
-
"model-00001-of-00003.safetensors: 24%|██▎ | 1.17G/4.98G [00:24<01:18, 48.7MB/s]\u001b[A\n",
|
524 |
-
"model-00001-of-00003.safetensors: 24%|██▍ | 1.18G/4.98G [00:24<01:24, 45.1MB/s]\u001b[A\n",
|
525 |
-
"\n",
|
526 |
-
"model-00002-of-00003.safetensors: 28%|██▊ | 1.38G/4.98G [00:24<01:20, 44.7MB/s]\u001b[A\u001b[A\n",
|
527 |
-
"model-00001-of-00003.safetensors: 24%|██▍ | 1.21G/4.98G [00:24<01:12, 52.1MB/s]\u001b[A\n",
|
528 |
-
"\n",
|
529 |
-
"model-00002-of-00003.safetensors: 28%|██▊ | 1.39G/4.98G [00:24<01:19, 45.0MB/s]\u001b[A\u001b[A\n",
|
530 |
-
"model-00001-of-00003.safetensors: 24%|██▍ | 1.22G/4.98G [00:25<01:30, 41.8MB/s]\u001b[A\n",
|
531 |
-
"model-00001-of-00003.safetensors: 25%|██▍ | 1.24G/4.98G [00:25<01:11, 52.1MB/s]\u001b[A\n",
|
532 |
-
"model-00001-of-00003.safetensors: 25%|██▌ | 1.25G/4.98G [00:25<01:08, 54.3MB/s]\u001b[A\n",
|
533 |
-
"model-00001-of-00003.safetensors: 25%|██▌ | 1.26G/4.98G [00:25<01:03, 58.3MB/s]\u001b[A\n",
|
534 |
-
"\n",
|
535 |
-
"model-00002-of-00003.safetensors: 28%|██▊ | 1.41G/4.98G [00:25<02:25, 24.7MB/s]\u001b[A\u001b[A\n",
|
536 |
-
"model-00001-of-00003.safetensors: 25%|██▌ | 1.27G/4.98G [00:26<01:04, 57.8MB/s]\u001b[A\n",
|
537 |
-
"\n",
|
538 |
-
"model-00002-of-00003.safetensors: 29%|██▉ | 1.45G/4.98G [00:26<01:09, 51.1MB/s]\u001b[A\u001b[A\n",
|
539 |
-
"model-00001-of-00003.safetensors: 26%|██▌ | 1.28G/4.98G [00:26<00:57, 64.4MB/s]\u001b[A\n",
|
540 |
-
"model-00001-of-00003.safetensors: 26%|██▌ | 1.29G/4.98G [00:26<01:03, 58.3MB/s]\u001b[A\n",
|
541 |
-
"model-00001-of-00003.safetensors: 26%|██▌ | 1.30G/4.98G [00:26<01:09, 53.1MB/s]\u001b[A\n",
|
542 |
-
"\n",
|
543 |
-
"model-00002-of-00003.safetensors: 30%|██▉ | 1.49G/4.98G [00:26<00:57, 61.2MB/s]\u001b[A\u001b[A\n",
|
544 |
-
"model-00001-of-00003.safetensors: 26%|██▋ | 1.31G/4.98G [00:26<01:00, 60.9MB/s]\u001b[A\n",
|
545 |
-
"model-00001-of-00003.safetensors: 27%|██▋ | 1.32G/4.98G [00:26<01:09, 53.0MB/s]\u001b[A\n",
|
546 |
-
"\n",
|
547 |
-
"model-00002-of-00003.safetensors: 30%|███ | 1.51G/4.98G [00:27<01:03, 54.6MB/s]\u001b[A\u001b[A\n",
|
548 |
-
"model-00001-of-00003.safetensors: 27%|██▋ | 1.33G/4.98G [00:27<01:07, 54.1MB/s]\u001b[A\n",
|
549 |
-
"\n",
|
550 |
-
"model-00002-of-00003.safetensors: 31%|███ | 1.52G/4.98G [00:27<01:07, 51.3MB/s]\u001b[A\u001b[A\n",
|
551 |
-
"model-00001-of-00003.safetensors: 27%|██▋ | 1.35G/4.98G [00:27<01:02, 58.3MB/s]\u001b[A\n",
|
552 |
-
"model-00001-of-00003.safetensors: 27%|██▋ | 1.36G/4.98G [00:27<01:08, 52.6MB/s]\u001b[A\n",
|
553 |
-
"model-00001-of-00003.safetensors: 28%|██▊ | 1.37G/4.98G [00:27<01:10, 51.2MB/s]\u001b[A\n",
|
554 |
-
"\n",
|
555 |
-
"model-00002-of-00003.safetensors: 31%|███ | 1.54G/4.98G [00:27<01:15, 45.7MB/s]\u001b[A\u001b[A\n",
|
556 |
-
"model-00001-of-00003.safetensors: 28%|██▊ | 1.38G/4.98G [00:28<01:03, 56.4MB/s]\u001b[A\n",
|
557 |
-
"\n",
|
558 |
-
"model-00002-of-00003.safetensors: 31%|███ | 1.55G/4.98G [00:28<01:11, 47.7MB/s]\u001b[A\u001b[A\n",
|
559 |
-
"\n",
|
560 |
-
"model-00002-of-00003.safetensors: 31%|███▏ | 1.56G/4.98G [00:28<01:05, 52.1MB/s]\u001b[A\u001b[A\n",
|
561 |
-
"model-00001-of-00003.safetensors: 28%|██▊ | 1.39G/4.98G [00:28<01:12, 49.6MB/s]\u001b[A\n",
|
562 |
-
"model-00001-of-00003.safetensors: 28%|██▊ | 1.41G/4.98G [00:28<01:03, 56.5MB/s]\u001b[A\n",
|
563 |
-
"\n",
|
564 |
-
"model-00002-of-00003.safetensors: 32%|███▏ | 1.57G/4.98G [00:28<01:09, 49.2MB/s]\u001b[A\u001b[A\n",
|
565 |
-
"\n",
|
566 |
-
"model-00002-of-00003.safetensors: 32%|███▏ | 1.59G/4.98G [00:28<00:51, 66.4MB/s]\u001b[A\u001b[A\n",
|
567 |
-
"model-00001-of-00003.safetensors: 28%|██▊ | 1.42G/4.98G [00:28<01:17, 46.3MB/s]\u001b[A\n",
|
568 |
-
"\n",
|
569 |
-
"model-00002-of-00003.safetensors: 32%|███▏ | 1.60G/4.98G [00:28<00:51, 66.0MB/s]\u001b[A\u001b[A\n",
|
570 |
-
"model-00001-of-00003.safetensors: 29%|██▊ | 1.43G/4.98G [00:29<01:23, 42.8MB/s]\u001b[A\n",
|
571 |
-
"\n",
|
572 |
-
"model-00002-of-00003.safetensors: 33%|███▎ | 1.63G/4.98G [00:29<00:54, 61.8MB/s]\u001b[A\u001b[A\n",
|
573 |
-
"model-00001-of-00003.safetensors: 29%|██▉ | 1.44G/4.98G [00:29<01:12, 49.1MB/s]\u001b[A\n",
|
574 |
-
"\n",
|
575 |
-
"model-00002-of-00003.safetensors: 33%|███▎ | 1.64G/4.98G [00:29<00:51, 64.7MB/s]\u001b[A\u001b[A\n",
|
576 |
-
"model-00001-of-00003.safetensors: 29%|██▉ | 1.45G/4.98G [00:29<01:12, 48.8MB/s]\u001b[A\n",
|
577 |
-
"model-00001-of-00003.safetensors: 29%|██▉ | 1.46G/4.98G [00:29<01:06, 52.7MB/s]\u001b[A\n",
|
578 |
-
"\n",
|
579 |
-
"model-00002-of-00003.safetensors: 33%|███▎ | 1.66G/4.98G [00:29<00:51, 65.0MB/s]\u001b[A\u001b[A\n",
|
580 |
-
"model-00001-of-00003.safetensors: 30%|██▉ | 1.48G/4.98G [00:30<01:10, 49.4MB/s]\u001b[A\n",
|
581 |
-
"model-00001-of-00003.safetensors: 30%|██▉ | 1.49G/4.98G [00:30<01:04, 54.3MB/s]\u001b[A\n",
|
582 |
-
"model-00001-of-00003.safetensors: 30%|███ | 1.51G/4.98G [00:30<00:55, 62.2MB/s]\u001b[A\n",
|
583 |
-
"model-00001-of-00003.safetensors: 31%|███ | 1.52G/4.98G [00:30<00:57, 60.4MB/s]\u001b[A\n",
|
584 |
-
"model-00001-of-00003.safetensors: 31%|███ | 1.54G/4.98G [00:30<00:47, 72.7MB/s]\u001b[A\n",
|
585 |
-
"model-00001-of-00003.safetensors: 31%|███ | 1.55G/4.98G [00:31<00:54, 63.5MB/s]\u001b[A\n",
|
586 |
-
"\n",
|
587 |
-
"model-00002-of-00003.safetensors: 33%|███▎ | 1.67G/4.98G [00:31<02:21, 23.5MB/s]\u001b[A\u001b[A\n",
|
588 |
-
"\n",
|
589 |
-
"model-00002-of-00003.safetensors: 34%|███▍ | 1.71G/4.98G [00:31<01:07, 48.4MB/s]\u001b[A\u001b[A\n",
|
590 |
-
"model-00001-of-00003.safetensors: 31%|███▏ | 1.56G/4.98G [00:31<00:56, 60.2MB/s]\u001b[A\n",
|
591 |
-
"\n",
|
592 |
-
"model-00002-of-00003.safetensors: 35%|███▌ | 1.75G/4.98G [00:31<00:46, 69.8MB/s]\u001b[A\u001b[A\n",
|
593 |
-
"model-00001-of-00003.safetensors: 32%|███▏ | 1.57G/4.98G [00:31<01:05, 52.0MB/s]\u001b[A\n",
|
594 |
-
"\n",
|
595 |
-
"model-00002-of-00003.safetensors: 36%|███▌ | 1.77G/4.98G [00:31<00:45, 70.0MB/s]\u001b[A\u001b[A\n",
|
596 |
-
"model-00001-of-00003.safetensors: 32%|███▏ | 1.59G/4.98G [00:31<00:59, 56.5MB/s]\u001b[A\n",
|
597 |
-
"model-00001-of-00003.safetensors: 32%|███▏ | 1.60G/4.98G [00:32<01:13, 46.1MB/s]\u001b[A\n",
|
598 |
-
"\n",
|
599 |
-
"model-00002-of-00003.safetensors: 36%|███▌ | 1.79G/4.98G [00:32<00:55, 57.0MB/s]\u001b[A\u001b[A\n",
|
600 |
-
"\n",
|
601 |
-
"model-00002-of-00003.safetensors: 36%|███▋ | 1.81G/4.98G [00:32<00:49, 63.8MB/s]\u001b[A\u001b[A\n",
|
602 |
-
"model-00001-of-00003.safetensors: 33%|███▎ | 1.63G/4.98G [00:32<01:06, 50.4MB/s]\u001b[A\n",
|
603 |
-
"model-00001-of-00003.safetensors: 33%|███▎ | 1.64G/4.98G [00:32<01:02, 53.3MB/s]\u001b[A\n",
|
604 |
-
"\n",
|
605 |
-
"model-00002-of-00003.safetensors: 37%|███▋ | 1.82G/4.98G [00:32<00:56, 55.7MB/s]\u001b[A\u001b[A\n",
|
606 |
-
"model-00001-of-00003.safetensors: 33%|███▎ | 1.66G/4.98G [00:33<00:54, 61.0MB/s]\u001b[A\n",
|
607 |
-
"\n",
|
608 |
-
"model-00002-of-00003.safetensors: 37%|███▋ | 1.85G/4.98G [00:33<00:52, 59.9MB/s]\u001b[A\u001b[A\n",
|
609 |
-
"model-00001-of-00003.safetensors: 33%|███▎ | 1.67G/4.98G [00:33<01:04, 51.3MB/s]\u001b[A\n",
|
610 |
-
"\n",
|
611 |
-
"model-00002-of-00003.safetensors: 37%|███▋ | 1.86G/4.98G [00:33<00:50, 61.7MB/s]\u001b[A\u001b[A\n",
|
612 |
-
"\n",
|
613 |
-
"model-00002-of-00003.safetensors: 37%|███▋ | 1.87G/4.98G [00:33<00:46, 67.0MB/s]\u001b[A\u001b[A\n",
|
614 |
-
"model-00001-of-00003.safetensors: 34%|███▍ | 1.69G/4.98G [00:33<00:55, 59.5MB/s]\u001b[A\n",
|
615 |
-
"\n",
|
616 |
-
"model-00002-of-00003.safetensors: 38%|███▊ | 1.88G/4.98G [00:33<00:48, 64.3MB/s]\u001b[A\u001b[A\n",
|
617 |
-
"model-00001-of-00003.safetensors: 34%|███▍ | 1.70G/4.98G [00:33<00:52, 62.7MB/s]\u001b[A\n",
|
618 |
-
"model-00001-of-00003.safetensors: 35%|███▍ | 1.72G/4.98G [00:33<00:42, 76.9MB/s]\u001b[A\n",
|
619 |
-
"model-00001-of-00003.safetensors: 35%|███▍ | 1.73G/4.98G [00:34<00:47, 68.8MB/s]\u001b[A\n",
|
620 |
-
"\n",
|
621 |
-
"model-00002-of-00003.safetensors: 38%|███▊ | 1.90G/4.98G [00:34<00:57, 53.8MB/s]\u001b[A\u001b[A\n",
|
622 |
-
"\n",
|
623 |
-
"model-00002-of-00003.safetensors: 38%|███▊ | 1.91G/4.98G [00:34<01:02, 48.9MB/s]\u001b[A\u001b[A\n",
|
624 |
-
"model-00001-of-00003.safetensors: 35%|███▌ | 1.75G/4.98G [00:34<00:48, 66.3MB/s]\u001b[A\n",
|
625 |
-
"model-00001-of-00003.safetensors: 35%|███▌ | 1.76G/4.98G [00:34<00:45, 70.0MB/s]\u001b[A\n",
|
626 |
-
"\n",
|
627 |
-
"model-00002-of-00003.safetensors: 39%|███▊ | 1.93G/4.98G [00:34<00:58, 52.1MB/s]\u001b[A\u001b[A\n",
|
628 |
-
"model-00001-of-00003.safetensors: 36%|███▌ | 1.78G/4.98G [00:34<00:46, 68.6MB/s]\u001b[A\n",
|
629 |
-
"\n",
|
630 |
-
"model-00002-of-00003.safetensors: 39%|███▉ | 1.94G/4.98G [00:34<00:59, 50.8MB/s]\u001b[A\u001b[A\n",
|
631 |
-
"\n",
|
632 |
-
"model-00002-of-00003.safetensors: 39%|███▉ | 1.96G/4.98G [00:35<00:47, 64.2MB/s]\u001b[A\u001b[A\n",
|
633 |
-
"model-00001-of-00003.safetensors: 36%|███▌ | 1.79G/4.98G [00:35<00:57, 55.1MB/s]\u001b[A\n",
|
634 |
-
"\n",
|
635 |
-
"model-00002-of-00003.safetensors: 40%|███▉ | 1.97G/4.98G [00:35<00:46, 64.4MB/s]\u001b[A\u001b[A\n",
|
636 |
-
"model-00001-of-00003.safetensors: 36%|███▋ | 1.81G/4.98G [00:35<00:43, 72.5MB/s]\u001b[A\n",
|
637 |
-
"\n",
|
638 |
-
"model-00002-of-00003.safetensors: 40%|███▉ | 1.98G/4.98G [00:35<00:46, 63.9MB/s]\u001b[A\u001b[A\n",
|
639 |
-
"model-00001-of-00003.safetensors: 37%|███▋ | 1.82G/4.98G [00:35<00:46, 68.3MB/s]\u001b[A\n",
|
640 |
-
"\n",
|
641 |
-
"model-00002-of-00003.safetensors: 40%|███▉ | 1.99G/4.98G [00:35<00:44, 67.5MB/s]\u001b[A\u001b[A\n",
|
642 |
-
"model-00001-of-00003.safetensors: 37%|███▋ | 1.84G/4.98G [00:35<00:48, 65.1MB/s]\u001b[A\n",
|
643 |
-
"\n",
|
644 |
-
"model-00002-of-00003.safetensors: 40%|████ | 2.00G/4.98G [00:36<01:00, 49.1MB/s]\u001b[A\u001b[A\n",
|
645 |
-
"model-00001-of-00003.safetensors: 37%|███▋ | 1.85G/4.98G [00:36<01:02, 50.0MB/s]\u001b[A\n",
|
646 |
-
"\n",
|
647 |
-
"model-00002-of-00003.safetensors: 41%|████ | 2.02G/4.98G [00:36<00:43, 67.7MB/s]\u001b[A\u001b[A\n",
|
648 |
-
"model-00001-of-00003.safetensors: 37%|███▋ | 1.86G/4.98G [00:36<00:55, 56.1MB/s]\u001b[A\n",
|
649 |
-
"model-00001-of-00003.safetensors: 37%|███▋ | 1.87G/4.98G [00:36<00:53, 57.9MB/s]\u001b[A\n",
|
650 |
-
"\n",
|
651 |
-
"model-00002-of-00003.safetensors: 41%|████ | 2.03G/4.98G [00:36<00:53, 54.6MB/s]\u001b[A\u001b[A\n",
|
652 |
-
"\n",
|
653 |
-
"model-00002-of-00003.safetensors: 41%|████ | 2.06G/4.98G [00:36<00:42, 69.0MB/s]\u001b[A\u001b[A\n",
|
654 |
-
"model-00001-of-00003.safetensors: 38%|███▊ | 1.88G/4.98G [00:37<01:29, 34.9MB/s]\u001b[A\n",
|
655 |
-
"\n",
|
656 |
-
"model-00002-of-00003.safetensors: 41%|████▏ | 2.07G/4.98G [00:37<00:54, 53.3MB/s]\u001b[A\u001b[A\n",
|
657 |
-
"model-00001-of-00003.safetensors: 38%|███▊ | 1.89G/4.98G [00:37<01:12, 42.8MB/s]\u001b[A\n",
|
658 |
-
"\n",
|
659 |
-
"model-00002-of-00003.safetensors: 42%|████▏ | 2.09G/4.98G [00:37<00:47, 61.4MB/s]\u001b[A\u001b[A\n",
|
660 |
-
"\n",
|
661 |
-
"model-00002-of-00003.safetensors: 42%|████▏ | 2.10G/4.98G [00:37<00:50, 57.1MB/s]\u001b[A\u001b[A\n",
|
662 |
-
"model-00001-of-00003.safetensors: 38%|███▊ | 1.90G/4.98G [00:37<01:29, 34.4MB/s]\u001b[A\n",
|
663 |
-
"model-00001-of-00003.safetensors: 38%|███▊ | 1.91G/4.98G [00:37<01:18, 39.3MB/s]\u001b[A\n",
|
664 |
-
"\n",
|
665 |
-
"model-00002-of-00003.safetensors: 43%|████▎ | 2.12G/4.98G [00:37<00:47, 60.8MB/s]\u001b[A\u001b[A\n",
|
666 |
-
"\n",
|
667 |
-
"model-00002-of-00003.safetensors: 43%|████▎ | 2.13G/4.98G [00:37<00:46, 62.0MB/s]\u001b[A\u001b[A\n",
|
668 |
-
"model-00001-of-00003.safetensors: 39%|███▊ | 1.93G/4.98G [00:38<01:02, 49.2MB/s]\u001b[A\n",
|
669 |
-
"\n",
|
670 |
-
"model-00002-of-00003.safetensors: 43%|████▎ | 2.15G/4.98G [00:38<00:45, 61.9MB/s]\u001b[A\u001b[A\n",
|
671 |
-
"model-00001-of-00003.safetensors: 39%|███▉ | 1.94G/4.98G [00:38<01:08, 44.3MB/s]\u001b[A\n",
|
672 |
-
"\n",
|
673 |
-
"model-00002-of-00003.safetensors: 44%|████▎ | 2.17G/4.98G [00:38<00:35, 79.7MB/s]\u001b[A\u001b[A\n",
|
674 |
-
"model-00001-of-00003.safetensors: 39%|███▉ | 1.96G/4.98G [00:38<00:54, 55.6MB/s]\u001b[A\n",
|
675 |
-
"model-00001-of-00003.safetensors: 40%|███▉ | 1.97G/4.98G [00:38<00:54, 55.6MB/s]\u001b[A\n",
|
676 |
-
"\n",
|
677 |
-
"model-00002-of-00003.safetensors: 44%|████▍ | 2.18G/4.98G [00:39<01:04, 43.3MB/s]\u001b[A\u001b[A\n",
|
678 |
-
"model-00001-of-00003.safetensors: 40%|███▉ | 1.99G/4.98G [00:39<00:56, 53.4MB/s]\u001b[A\n",
|
679 |
-
"\n",
|
680 |
-
"model-00002-of-00003.safetensors: 45%|████▍ | 2.22G/4.98G [00:39<00:33, 81.5MB/s]\u001b[A\u001b[A\n",
|
681 |
-
"model-00001-of-00003.safetensors: 40%|████ | 2.00G/4.98G [00:39<00:58, 50.9MB/s]\u001b[A\n",
|
682 |
-
"model-00001-of-00003.safetensors: 41%|████ | 2.02G/4.98G [00:39<00:52, 56.5MB/s]\u001b[A\n",
|
683 |
-
"\n",
|
684 |
-
"model-00002-of-00003.safetensors: 45%|████▌ | 2.24G/4.98G [00:39<00:43, 62.6MB/s]\u001b[A\u001b[A\n",
|
685 |
-
"\n",
|
686 |
-
"model-00002-of-00003.safetensors: 45%|████▌ | 2.26G/4.98G [00:40<00:40, 66.4MB/s]\u001b[A\u001b[A\n",
|
687 |
-
"model-00001-of-00003.safetensors: 41%|████ | 2.03G/4.98G [00:40<01:08, 42.9MB/s]\u001b[A\n",
|
688 |
-
"\n",
|
689 |
-
"model-00002-of-00003.safetensors: 46%|████▌ | 2.29G/4.98G [00:40<00:43, 61.9MB/s]\u001b[A\u001b[A\n",
|
690 |
-
"model-00001-of-00003.safetensors: 41%|████ | 2.04G/4.98G [00:40<01:20, 36.3MB/s]\u001b[A\n",
|
691 |
-
"\n",
|
692 |
-
"model-00002-of-00003.safetensors: 46%|████▋ | 2.31G/4.98G [00:40<00:38, 69.2MB/s]\u001b[A\u001b[A\n",
|
693 |
-
"\n",
|
694 |
-
"model-00002-of-00003.safetensors: 47%|████▋ | 2.33G/4.98G [00:40<00:32, 82.5MB/s]\u001b[A\u001b[A\n",
|
695 |
-
"model-00001-of-00003.safetensors: 41%|████ | 2.06G/4.98G [00:41<01:24, 34.6MB/s]\u001b[A\n",
|
696 |
-
"\n",
|
697 |
-
"model-00002-of-00003.safetensors: 47%|████▋ | 2.35G/4.98G [00:41<00:30, 87.6MB/s]\u001b[A\u001b[A\n",
|
698 |
-
"model-00001-of-00003.safetensors: 41%|████▏ | 2.07G/4.98G [00:41<01:14, 39.2MB/s]\u001b[A\n",
|
699 |
-
"\n",
|
700 |
-
"model-00002-of-00003.safetensors: 48%|████▊ | 2.37G/4.98G [00:41<00:34, 75.4MB/s]\u001b[A\u001b[A\n",
|
701 |
-
"model-00001-of-00003.safetensors: 42%|████▏ | 2.09G/4.98G [00:41<00:59, 48.6MB/s]\u001b[A\n",
|
702 |
-
"\n",
|
703 |
-
"model-00002-of-00003.safetensors: 48%|████▊ | 2.38G/4.98G [00:42<01:16, 34.0MB/s]\u001b[A\u001b[A\n",
|
704 |
-
"model-00001-of-00003.safetensors: 42%|████▏ | 2.10G/4.98G [00:42<01:54, 25.2MB/s]\u001b[A\n",
|
705 |
-
"\n",
|
706 |
-
"model-00002-of-00003.safetensors: 49%|████▊ | 2.42G/4.98G [00:42<00:40, 62.6MB/s]\u001b[A\u001b[A\n",
|
707 |
-
"model-00001-of-00003.safetensors: 43%|████▎ | 2.15G/4.98G [00:42<00:46, 61.5MB/s]\u001b[A\n",
|
708 |
-
"model-00001-of-00003.safetensors: 44%|████▎ | 2.17G/4.98G [00:42<00:37, 74.7MB/s]\u001b[A\n",
|
709 |
-
"\n",
|
710 |
-
"model-00002-of-00003.safetensors: 49%|████▉ | 2.44G/4.98G [00:42<00:39, 64.0MB/s]\u001b[A\u001b[A\n",
|
711 |
-
"model-00001-of-00003.safetensors: 44%|████▍ | 2.19G/4.98G [00:42<00:33, 82.8MB/s]\u001b[A\n",
|
712 |
-
"\n",
|
713 |
-
"model-00002-of-00003.safetensors: 49%|████▉ | 2.46G/4.98G [00:43<00:39, 63.6MB/s]\u001b[A\u001b[A\n",
|
714 |
-
"\n",
|
715 |
-
"model-00002-of-00003.safetensors: 50%|████▉ | 2.49G/4.98G [00:43<00:33, 74.4MB/s]\u001b[A\u001b[A\n",
|
716 |
-
"model-00001-of-00003.safetensors: 44%|████▍ | 2.21G/4.98G [00:43<00:45, 60.8MB/s]\u001b[A\n",
|
717 |
-
"\n",
|
718 |
-
"model-00002-of-00003.safetensors: 50%|█████ | 2.51G/4.98G [00:43<00:32, 76.9MB/s]\u001b[A\u001b[A\n",
|
719 |
-
"model-00001-of-00003.safetensors: 45%|████▍ | 2.23G/4.98G [00:43<00:46, 58.6MB/s]\u001b[A\n",
|
720 |
-
"model-00001-of-00003.safetensors: 45%|████▌ | 2.24G/4.98G [00:44<00:52, 51.8MB/s]\u001b[A\n",
|
721 |
-
"\n",
|
722 |
-
"model-00002-of-00003.safetensors: 51%|█████ | 2.53G/4.98G [00:44<00:43, 56.8MB/s]\u001b[A\u001b[A\n",
|
723 |
-
"model-00001-of-00003.safetensors: 45%|████▌ | 2.26G/4.98G [00:44<00:45, 59.5MB/s]\u001b[A\n",
|
724 |
-
"\n",
|
725 |
-
"model-00002-of-00003.safetensors: 51%|█████ | 2.54G/4.98G [00:44<00:48, 50.3MB/s]\u001b[A\u001b[A\n",
|
726 |
-
"model-00001-of-00003.safetensors: 46%|████▌ | 2.28G/4.98G [00:44<00:44, 60.7MB/s]\u001b[A\n",
|
727 |
-
"\n",
|
728 |
-
"model-00002-of-00003.safetensors: 51%|█████ | 2.55G/4.98G [00:44<00:48, 49.9MB/s]\u001b[A\u001b[A\n",
|
729 |
-
"model-00001-of-00003.safetensors: 46%|████▌ | 2.30G/4.98G [00:45<00:47, 57.0MB/s]\u001b[A\n",
|
730 |
-
"\n",
|
731 |
-
"model-00002-of-00003.safetensors: 52%|█████▏ | 2.57G/4.98G [00:45<00:43, 55.7MB/s]\u001b[A\u001b[A\n",
|
732 |
-
"\n",
|
733 |
-
"model-00002-of-00003.safetensors: 52%|█████▏ | 2.58G/4.98G [00:45<00:51, 47.0MB/s]\u001b[A\u001b[A\n",
|
734 |
-
"model-00001-of-00003.safetensors: 46%|████▋ | 2.31G/4.98G [00:45<01:03, 42.0MB/s]\u001b[A\n",
|
735 |
-
"\n",
|
736 |
-
"model-00002-of-00003.safetensors: 52%|█████▏ | 2.60G/4.98G [00:45<00:45, 52.8MB/s]\u001b[A\u001b[A\n",
|
737 |
-
"\n",
|
738 |
-
"model-00002-of-00003.safetensors: 52%|█████▏ | 2.61G/4.98G [00:45<00:43, 54.3MB/s]\u001b[A\u001b[A\n",
|
739 |
-
"model-00001-of-00003.safetensors: 47%|████▋ | 2.33G/4.98G [00:46<01:11, 37.3MB/s]\u001b[A\n",
|
740 |
-
"\n",
|
741 |
-
"model-00002-of-00003.safetensors: 53%|█████▎ | 2.62G/4.98G [00:46<00:48, 49.0MB/s]\u001b[A\u001b[A\n",
|
742 |
-
"\n",
|
743 |
-
"model-00002-of-00003.safetensors: 53%|█████▎ | 2.63G/4.98G [00:46<00:44, 52.7MB/s]\u001b[A\u001b[A\n",
|
744 |
-
"model-00001-of-00003.safetensors: 47%|████▋ | 2.34G/4.98G [00:46<01:08, 38.5MB/s]\u001b[A\n",
|
745 |
-
"\n",
|
746 |
-
"model-00002-of-00003.safetensors: 53%|█████▎ | 2.64G/4.98G [00:46<00:43, 53.8MB/s]\u001b[A\u001b[A\n",
|
747 |
-
"model-00001-of-00003.safetensors: 47%|████▋ | 2.36G/4.98G [00:46<00:54, 47.9MB/s]\u001b[A\n",
|
748 |
-
"\n",
|
749 |
-
"model-00002-of-00003.safetensors: 53%|█████▎ | 2.66G/4.98G [00:46<00:38, 60.6MB/s]\u001b[A\u001b[A\n",
|
750 |
-
"\n",
|
751 |
-
"model-00002-of-00003.safetensors: 54%|█████▎ | 2.67G/4.98G [00:46<00:35, 64.7MB/s]\u001b[A\u001b[A\n",
|
752 |
-
"model-00001-of-00003.safetensors: 48%|████▊ | 2.37G/4.98G [00:47<01:00, 43.5MB/s]\u001b[A\n",
|
753 |
-
"\n",
|
754 |
-
"model-00002-of-00003.safetensors: 54%|█████▍ | 2.69G/4.98G [00:47<00:33, 69.1MB/s]\u001b[A\u001b[A\n",
|
755 |
-
"model-00001-of-00003.safetensors: 48%|████▊ | 2.39G/4.98G [00:47<00:53, 48.6MB/s]\u001b[A\n",
|
756 |
-
"model-00001-of-00003.safetensors: 48%|████▊ | 2.40G/4.98G [00:47<00:54, 47.7MB/s]\u001b[A\n",
|
757 |
-
"\n",
|
758 |
-
"model-00002-of-00003.safetensors: 54%|█████▍ | 2.71G/4.98G [00:47<00:43, 52.8MB/s]\u001b[A\u001b[A\n",
|
759 |
-
"model-00001-of-00003.safetensors: 49%|████▊ | 2.42G/4.98G [00:47<00:44, 57.3MB/s]\u001b[A\n",
|
760 |
-
"\n",
|
761 |
-
"model-00002-of-00003.safetensors: 55%|█████▍ | 2.73G/4.98G [00:47<00:36, 61.5MB/s]\u001b[A\u001b[A\n",
|
762 |
-
"model-00001-of-00003.safetensors: 49%|████▉ | 2.43G/4.98G [00:48<00:41, 61.0MB/s]\u001b[A\n",
|
763 |
-
"\n",
|
764 |
-
"model-00002-of-00003.safetensors: 55%|█████▍ | 2.74G/4.98G [00:48<00:40, 55.6MB/s]\u001b[A\u001b[A\n",
|
765 |
-
"model-00001-of-00003.safetensors: 49%|████▉ | 2.45G/4.98G [00:48<00:43, 58.5MB/s]\u001b[A\n",
|
766 |
-
"\n",
|
767 |
-
"model-00002-of-00003.safetensors: 55%|█████▌ | 2.76G/4.98G [00:48<00:40, 54.7MB/s]\u001b[A\u001b[A\n",
|
768 |
-
"model-00001-of-00003.safetensors: 49%|████▉ | 2.46G/4.98G [00:48<00:51, 49.0MB/s]\u001b[A\n",
|
769 |
-
"\n",
|
770 |
-
"model-00002-of-00003.safetensors: 56%|█████▌ | 2.77G/4.98G [00:48<00:42, 51.6MB/s]\u001b[A\u001b[A\n",
|
771 |
-
"\n",
|
772 |
-
"model-00002-of-00003.safetensors: 56%|█████▌ | 2.79G/4.98G [00:48<00:34, 63.3MB/s]\u001b[A\u001b[A\n",
|
773 |
-
"model-00001-of-00003.safetensors: 50%|████▉ | 2.49G/4.98G [00:49<00:47, 52.7MB/s]\u001b[A\n",
|
774 |
-
"model-00001-of-00003.safetensors: 50%|█████ | 2.50G/4.98G [00:49<00:51, 48.1MB/s]\u001b[A\n",
|
775 |
-
"\n",
|
776 |
-
"model-00002-of-00003.safetensors: 56%|█████▌ | 2.80G/4.98G [00:49<00:44, 49.5MB/s]\u001b[A\u001b[A\n",
|
777 |
-
"\n",
|
778 |
-
"model-00002-of-00003.safetensors: 56%|█████▋ | 2.81G/4.98G [00:49<00:40, 53.5MB/s]\u001b[A\u001b[A\n",
|
779 |
-
"model-00001-of-00003.safetensors: 50%|█████ | 2.51G/4.98G [00:49<00:48, 51.1MB/s]\u001b[A\n",
|
780 |
-
"model-00001-of-00003.safetensors: 51%|█████ | 2.52G/4.98G [00:49<00:45, 54.7MB/s]\u001b[A\n",
|
781 |
-
"\n",
|
782 |
-
"model-00002-of-00003.safetensors: 57%|█████▋ | 2.82G/4.98G [00:49<00:39, 55.4MB/s]\u001b[A\u001b[A\n",
|
783 |
-
"model-00001-of-00003.safetensors: 51%|█████ | 2.54G/4.98G [00:50<00:41, 58.9MB/s]\u001b[A\n",
|
784 |
-
"\n",
|
785 |
-
"model-00002-of-00003.safetensors: 57%|█████▋ | 2.84G/4.98G [00:50<00:42, 50.6MB/s]\u001b[A\u001b[A\n",
|
786 |
-
"\n",
|
787 |
-
"model-00002-of-00003.safetensors: 57%|█████▋ | 2.85G/4.98G [00:50<00:44, 47.9MB/s]\u001b[A\u001b[A\n",
|
788 |
-
"model-00001-of-00003.safetensors: 51%|█████ | 2.55G/4.98G [00:50<00:54, 44.4MB/s]\u001b[A\n",
|
789 |
-
"model-00001-of-00003.safetensors: 52%|█████▏ | 2.57G/4.98G [00:50<00:43, 55.0MB/s]\u001b[A\n",
|
790 |
-
"model-00001-of-00003.safetensors: 52%|█████▏ | 2.58G/4.98G [00:50<00:44, 53.7MB/s]\u001b[A\n",
|
791 |
-
"\n",
|
792 |
-
"model-00002-of-00003.safetensors: 58%|█████▊ | 2.87G/4.98G [00:50<00:49, 42.3MB/s]\u001b[A\u001b[A\n",
|
793 |
-
"\n",
|
794 |
-
"model-00002-of-00003.safetensors: 58%|█████▊ | 2.89G/4.98G [00:51<00:35, 58.2MB/s]\u001b[A\u001b[A\n",
|
795 |
-
"model-00001-of-00003.safetensors: 52%|█████▏ | 2.60G/4.98G [00:51<00:44, 54.0MB/s]\u001b[A\n",
|
796 |
-
"\n",
|
797 |
-
"model-00002-of-00003.safetensors: 58%|█████▊ | 2.90G/4.98G [00:51<00:43, 47.9MB/s]\u001b[A\u001b[A\n",
|
798 |
-
"model-00001-of-00003.safetensors: 52%|█████▏ | 2.61G/4.98G [00:51<00:45, 51.7MB/s]\u001b[A\n",
|
799 |
-
"\n",
|
800 |
-
"model-00002-of-00003.safetensors: 59%|█████▊ | 2.92G/4.98G [00:51<00:41, 49.8MB/s]\u001b[A\u001b[A\n",
|
801 |
-
"model-00001-of-00003.safetensors: 53%|█████▎ | 2.63G/4.98G [00:51<00:43, 54.6MB/s]\u001b[A\n",
|
802 |
-
"\n",
|
803 |
-
"model-00002-of-00003.safetensors: 59%|█████▉ | 2.94G/4.98G [00:51<00:32, 62.3MB/s]\u001b[A\u001b[A\n",
|
804 |
-
"model-00001-of-00003.safetensors: 53%|█████▎ | 2.64G/4.98G [00:52<00:40, 57.5MB/s]\u001b[A\n",
|
805 |
-
"\n",
|
806 |
-
"model-00002-of-00003.safetensors: 59%|█████▉ | 2.95G/4.98G [00:52<00:37, 54.4MB/s]\u001b[A\u001b[A\n",
|
807 |
-
"model-00001-of-00003.safetensors: 53%|█████▎ | 2.65G/4.98G [00:52<00:47, 49.0MB/s]\u001b[A\n",
|
808 |
-
"model-00001-of-00003.safetensors: 53%|█████▎ | 2.66G/4.98G [00:52<00:42, 54.4MB/s]\u001b[A\n",
|
809 |
-
"\n",
|
810 |
-
"model-00002-of-00003.safetensors: 60%|█████▉ | 2.97G/4.98G [00:52<00:38, 52.1MB/s]\u001b[A\u001b[A\n",
|
811 |
-
"model-00001-of-00003.safetensors: 54%|█████▎ | 2.67G/4.98G [00:52<00:48, 47.1MB/s]\u001b[A\n",
|
812 |
-
"\n",
|
813 |
-
"model-00002-of-00003.safetensors: 60%|█████▉ | 2.98G/4.98G [00:52<00:38, 51.6MB/s]\u001b[A\u001b[A\n",
|
814 |
-
"model-00001-of-00003.safetensors: 54%|█████▍ | 2.69G/4.98G [00:53<00:39, 57.3MB/s]\u001b[A\n",
|
815 |
-
"model-00001-of-00003.safetensors: 54%|█████▍ | 2.71G/4.98G [00:53<00:42, 53.5MB/s]\u001b[A\n",
|
816 |
-
"\n",
|
817 |
-
"model-00002-of-00003.safetensors: 60%|█████▉ | 2.99G/4.98G [00:53<00:53, 37.6MB/s]\u001b[A\u001b[A\n",
|
818 |
-
"model-00001-of-00003.safetensors: 55%|█████▍ | 2.73G/4.98G [00:53<00:40, 55.8MB/s]\u001b[A\n",
|
819 |
-
"model-00001-of-00003.safetensors: 55%|█████▍ | 2.74G/4.98G [00:53<00:38, 58.2MB/s]\u001b[A\n",
|
820 |
-
"\n",
|
821 |
-
"model-00002-of-00003.safetensors: 60%|██████ | 3.00G/4.98G [00:54<01:15, 26.3MB/s]\u001b[A\u001b[A\n",
|
822 |
-
"model-00001-of-00003.safetensors: 55%|█████▌ | 2.76G/4.98G [00:54<00:36, 60.6MB/s]\u001b[A\n",
|
823 |
-
"\n",
|
824 |
-
"model-00002-of-00003.safetensors: 60%|██████ | 3.01G/4.98G [00:54<01:00, 32.5MB/s]\u001b[A\u001b[A\n",
|
825 |
-
"model-00001-of-00003.safetensors: 56%|█████▌ | 2.77G/4.98G [00:54<00:39, 55.8MB/s]\u001b[A\n",
|
826 |
-
"model-00001-of-00003.safetensors: 56%|█████▌ | 2.79G/4.98G [00:54<00:31, 68.8MB/s]\u001b[A\n",
|
827 |
-
"\n",
|
828 |
-
"model-00002-of-00003.safetensors: 61%|██████ | 3.03G/4.98G [00:54<00:47, 40.9MB/s]\u001b[A\u001b[A\n",
|
829 |
-
"model-00001-of-00003.safetensors: 56%|█████▌ | 2.80G/4.98G [00:54<00:33, 65.2MB/s]\u001b[A\n",
|
830 |
-
"model-00001-of-00003.safetensors: 56%|█████▋ | 2.81G/4.98G [00:54<00:34, 63.7MB/s]\u001b[A\n",
|
831 |
-
"model-00001-of-00003.safetensors: 57%|█████▋ | 2.82G/4.98G [00:55<00:32, 66.4MB/s]\u001b[A\n",
|
832 |
-
"\n",
|
833 |
-
"model-00002-of-00003.safetensors: 61%|██████ | 3.04G/4.98G [00:55<01:01, 31.4MB/s]\u001b[A\u001b[A\n",
|
834 |
-
"model-00001-of-00003.safetensors: 57%|█████▋ | 2.84G/4.98G [00:55<00:30, 70.3MB/s]\u001b[A\n",
|
835 |
-
"\n",
|
836 |
-
"model-00002-of-00003.safetensors: 61%|██████▏ | 3.06G/4.98G [00:55<00:43, 44.0MB/s]\u001b[A\u001b[A\n",
|
837 |
-
"model-00001-of-00003.safetensors: 57%|█████▋ | 2.85G/4.98G [00:55<00:35, 60.6MB/s]\u001b[A\n",
|
838 |
-
"\n",
|
839 |
-
"model-00002-of-00003.safetensors: 62%|██████▏ | 3.07G/4.98G [00:55<00:50, 38.0MB/s]\u001b[A\u001b[A\n",
|
840 |
-
"model-00001-of-00003.safetensors: 58%|█████▊ | 2.87G/4.98G [00:55<00:33, 63.4MB/s]\u001b[A\n",
|
841 |
-
"\n",
|
842 |
-
"model-00002-of-00003.safetensors: 62%|██████▏ | 3.08G/4.98G [00:55<00:44, 42.3MB/s]\u001b[A\u001b[A\n",
|
843 |
-
"model-00001-of-00003.safetensors: 58%|█████▊ | 2.88G/4.98G [00:55<00:30, 68.2MB/s]\u001b[A\n",
|
844 |
-
"\n",
|
845 |
-
"model-00002-of-00003.safetensors: 62%|██████▏ | 3.09G/4.98G [00:55<00:39, 47.7MB/s]\u001b[A\u001b[A\n",
|
846 |
-
"\n",
|
847 |
-
"model-00002-of-00003.safetensors: 62%|██████▏ | 3.10G/4.98G [00:56<00:34, 54.4MB/s]\u001b[A\u001b[A\n",
|
848 |
-
"model-00001-of-00003.safetensors: 58%|█████▊ | 2.90G/4.98G [00:56<00:27, 76.3MB/s]\u001b[A\n",
|
849 |
-
"\n",
|
850 |
-
"model-00002-of-00003.safetensors: 63%|██████▎ | 3.11G/4.98G [00:56<00:34, 54.1MB/s]\u001b[A\u001b[A\n",
|
851 |
-
"model-00001-of-00003.safetensors: 59%|█████▊ | 2.92G/4.98G [00:56<00:31, 66.5MB/s]\u001b[A\n",
|
852 |
-
"\n",
|
853 |
-
"model-00002-of-00003.safetensors: 63%|██████▎ | 3.12G/4.98G [00:56<00:31, 59.4MB/s]\u001b[A\u001b[A\n",
|
854 |
-
"\n",
|
855 |
-
"model-00002-of-00003.safetensors: 63%|██████▎ | 3.15G/4.98G [00:56<00:29, 62.9MB/s]\u001b[A\u001b[A\n",
|
856 |
-
"\n",
|
857 |
-
"model-00002-of-00003.safetensors: 64%|██████▎ | 3.17G/4.98G [00:56<00:22, 82.3MB/s]\u001b[A\u001b[A\n",
|
858 |
-
"model-00001-of-00003.safetensors: 59%|█████▉ | 2.94G/4.98G [00:56<00:37, 54.7MB/s]\u001b[A\n",
|
859 |
-
"\n",
|
860 |
-
"model-00002-of-00003.safetensors: 64%|██████▍ | 3.18G/4.98G [00:56<00:21, 85.1MB/s]\u001b[A\u001b[A\n",
|
861 |
-
"model-00001-of-00003.safetensors: 59%|█████▉ | 2.95G/4.98G [00:57<00:35, 57.5MB/s]\u001b[A\n",
|
862 |
-
"\n",
|
863 |
-
"model-00002-of-00003.safetensors: 64%|██████▍ | 3.19G/4.98G [00:57<00:20, 87.9MB/s]\u001b[A\u001b[A\n",
|
864 |
-
"model-00001-of-00003.safetensors: 60%|█████▉ | 2.97G/4.98G [00:57<00:34, 58.6MB/s]\u001b[A\n",
|
865 |
-
"\n",
|
866 |
-
"model-00002-of-00003.safetensors: 64%|██████▍ | 3.21G/4.98G [00:57<00:23, 76.9MB/s]\u001b[A\u001b[A\n",
|
867 |
-
"model-00001-of-00003.safetensors: 60%|█████▉ | 2.98G/4.98G [00:57<00:35, 55.8MB/s]\u001b[A\n",
|
868 |
-
"\n",
|
869 |
-
"model-00002-of-00003.safetensors: 65%|██████▍ | 3.22G/4.98G [00:57<00:27, 64.2MB/s]\u001b[A\u001b[A\n",
|
870 |
-
"\n",
|
871 |
-
"model-00002-of-00003.safetensors: 65%|██████▍ | 3.23G/4.98G [00:57<00:26, 66.6MB/s]\u001b[A\u001b[A\n",
|
872 |
-
"\n",
|
873 |
-
"model-00002-of-00003.safetensors: 65%|██████▌ | 3.24G/4.98G [00:57<00:27, 62.3MB/s]\u001b[A\u001b[A\n",
|
874 |
-
"model-00001-of-00003.safetensors: 60%|██████ | 3.00G/4.98G [00:58<00:39, 49.9MB/s]\u001b[A\n",
|
875 |
-
"\n",
|
876 |
-
"model-00002-of-00003.safetensors: 65%|██████▌ | 3.25G/4.98G [00:58<00:35, 48.5MB/s]\u001b[A\u001b[A\n",
|
877 |
-
"model-00001-of-00003.safetensors: 60%|██████ | 3.01G/4.98G [00:58<00:42, 46.5MB/s]\u001b[A\n",
|
878 |
-
"\n",
|
879 |
-
"model-00002-of-00003.safetensors: 65%|██████▌ | 3.26G/4.98G [00:58<00:45, 38.2MB/s]\u001b[A\u001b[A\n",
|
880 |
-
"model-00001-of-00003.safetensors: 61%|██████ | 3.03G/4.98G [00:58<00:40, 47.8MB/s]\u001b[A\n",
|
881 |
-
"\n",
|
882 |
-
"model-00002-of-00003.safetensors: 66%|██████▌ | 3.27G/4.98G [00:59<00:49, 34.8MB/s]\u001b[A\u001b[A\n",
|
883 |
-
"model-00001-of-00003.safetensors: 61%|██████ | 3.04G/4.98G [00:59<00:50, 38.8MB/s]\u001b[A\n",
|
884 |
-
"\n",
|
885 |
-
"model-00002-of-00003.safetensors: 66%|██████▌ | 3.28G/4.98G [00:59<00:48, 34.7MB/s]\u001b[A\u001b[A\n",
|
886 |
-
"model-00001-of-00003.safetensors: 61%|██████ | 3.05G/4.98G [00:59<00:56, 34.3MB/s]\u001b[A\n",
|
887 |
-
"\n",
|
888 |
-
"model-00002-of-00003.safetensors: 66%|██████▋ | 3.30G/4.98G [00:59<00:39, 42.6MB/s]\u001b[A\u001b[A\n",
|
889 |
-
"model-00001-of-00003.safetensors: 61%|██████▏ | 3.06G/4.98G [00:59<00:49, 38.9MB/s]\u001b[A\n",
|
890 |
-
"model-00001-of-00003.safetensors: 62%|██████▏ | 3.07G/4.98G [01:00<00:45, 41.8MB/s]\u001b[A\n",
|
891 |
-
"\n",
|
892 |
-
"model-00002-of-00003.safetensors: 67%|██████▋ | 3.31G/4.98G [01:00<00:40, 41.3MB/s]\u001b[A\u001b[A\n",
|
893 |
-
"\n",
|
894 |
-
"model-00002-of-00003.safetensors: 67%|██████▋ | 3.33G/4.98G [01:00<00:30, 54.2MB/s]\u001b[A\u001b[A\n",
|
895 |
-
"\n",
|
896 |
-
"model-00002-of-00003.safetensors: 67%|██████▋ | 3.34G/4.98G [01:00<00:29, 54.8MB/s]\u001b[A\u001b[A\n",
|
897 |
-
"model-00001-of-00003.safetensors: 62%|██████▏ | 3.09G/4.98G [01:00<00:47, 39.6MB/s]\u001b[A\n",
|
898 |
-
"\n",
|
899 |
-
"model-00002-of-00003.safetensors: 68%|██████▊ | 3.37G/4.98G [01:00<00:26, 61.1MB/s]\u001b[A\u001b[A\n",
|
900 |
-
"model-00001-of-00003.safetensors: 63%|██████▎ | 3.11G/4.98G [01:00<00:37, 50.2MB/s]\u001b[A\n",
|
901 |
-
"\n",
|
902 |
-
"model-00002-of-00003.safetensors: 68%|██████▊ | 3.39G/4.98G [01:00<00:20, 79.3MB/s]\u001b[A\u001b[A\n",
|
903 |
-
"\n",
|
904 |
-
"model-00002-of-00003.safetensors: 68%|██████▊ | 3.40G/4.98G [01:01<00:20, 76.9MB/s]\u001b[A\u001b[A\n",
|
905 |
-
"model-00001-of-00003.safetensors: 63%|██████▎ | 3.12G/4.98G [01:01<00:37, 49.1MB/s]\u001b[A\n",
|
906 |
-
"model-00001-of-00003.safetensors: 63%|██████▎ | 3.14G/4.98G [01:01<00:33, 55.2MB/s]\u001b[A\n",
|
907 |
-
"\n",
|
908 |
-
"model-00002-of-00003.safetensors: 69%|██████▊ | 3.42G/4.98G [01:01<00:18, 82.6MB/s]\u001b[A\u001b[A\n",
|
909 |
-
"model-00001-of-00003.safetensors: 63%|██████▎ | 3.15G/4.98G [01:01<00:40, 45.3MB/s]\u001b[A\n",
|
910 |
-
"\n",
|
911 |
-
"model-00002-of-00003.safetensors: 69%|██████▉ | 3.43G/4.98G [01:01<00:24, 63.2MB/s]\u001b[A\u001b[A\n",
|
912 |
-
"model-00001-of-00003.safetensors: 63%|██████▎ | 3.16G/4.98G [01:01<00:37, 48.3MB/s]\u001b[A\n",
|
913 |
-
"\n",
|
914 |
-
"model-00002-of-00003.safetensors: 69%|██████▉ | 3.45G/4.98G [01:01<00:21, 69.7MB/s]\u001b[A\u001b[A\n",
|
915 |
-
"model-00001-of-00003.safetensors: 64%|██████▍ | 3.18G/4.98G [01:02<00:32, 56.1MB/s]\u001b[A\n",
|
916 |
-
"\n",
|
917 |
-
"model-00002-of-00003.safetensors: 69%|██████▉ | 3.46G/4.98G [01:02<00:25, 58.6MB/s]\u001b[A\u001b[A\n",
|
918 |
-
"model-00001-of-00003.safetensors: 64%|██████▍ | 3.19G/4.98G [01:02<00:32, 55.5MB/s]\u001b[A\n",
|
919 |
-
"\n",
|
920 |
-
"model-00002-of-00003.safetensors: 70%|██████▉ | 3.47G/4.98G [01:02<00:27, 55.6MB/s]\u001b[A\u001b[A\n",
|
921 |
-
"model-00001-of-00003.safetensors: 64%|██████▍ | 3.20G/4.98G [01:02<00:30, 57.7MB/s]\u001b[A\n",
|
922 |
-
"model-00001-of-00003.safetensors: 64%|██████▍ | 3.21G/4.98G [01:02<00:31, 57.2MB/s]\u001b[A\n",
|
923 |
-
"\n",
|
924 |
-
"model-00002-of-00003.safetensors: 70%|██████▉ | 3.48G/4.98G [01:02<00:29, 50.2MB/s]\u001b[A\u001b[A\n",
|
925 |
-
"model-00001-of-00003.safetensors: 65%|██████▍ | 3.22G/4.98G [01:02<00:28, 61.9MB/s]\u001b[A\n",
|
926 |
-
"model-00001-of-00003.safetensors: 65%|██████▌ | 3.24G/4.98G [01:03<00:26, 64.7MB/s]\u001b[A\n",
|
927 |
-
"\n",
|
928 |
-
"model-00002-of-00003.safetensors: 70%|███████ | 3.49G/4.98G [01:02<00:37, 40.0MB/s]\u001b[A\u001b[A\n",
|
929 |
-
"model-00001-of-00003.safetensors: 65%|██████▌ | 3.25G/4.98G [01:03<00:25, 68.5MB/s]\u001b[A\n",
|
930 |
-
"\n",
|
931 |
-
"model-00002-of-00003.safetensors: 71%|███████ | 3.51G/4.98G [01:03<00:26, 54.8MB/s]\u001b[A\u001b[A\n",
|
932 |
-
"model-00001-of-00003.safetensors: 66%|██████▌ | 3.27G/4.98G [01:03<00:20, 83.3MB/s]\u001b[A\n",
|
933 |
-
"\n",
|
934 |
-
"model-00002-of-00003.safetensors: 71%|███████ | 3.52G/4.98G [01:03<00:27, 52.4MB/s]\u001b[A\u001b[A\n",
|
935 |
-
"model-00001-of-00003.safetensors: 66%|██████▌ | 3.28G/4.98G [01:03<00:23, 72.0MB/s]\u001b[A\n",
|
936 |
-
"model-00001-of-00003.safetensors: 66%|██████▋ | 3.30G/4.98G [01:03<00:20, 81.1MB/s]\u001b[A\n",
|
937 |
-
"\n",
|
938 |
-
"model-00002-of-00003.safetensors: 71%|███████ | 3.54G/4.98G [01:03<00:25, 55.9MB/s]\u001b[A\u001b[A\n",
|
939 |
-
"model-00001-of-00003.safetensors: 67%|██████▋ | 3.31G/4.98G [01:03<00:23, 71.8MB/s]\u001b[A\n",
|
940 |
-
"model-00001-of-00003.safetensors: 67%|██████▋ | 3.33G/4.98G [01:04<00:21, 76.1MB/s]\u001b[A\n",
|
941 |
-
"\n",
|
942 |
-
"model-00002-of-00003.safetensors: 71%|███████▏ | 3.55G/4.98G [01:04<00:32, 44.5MB/s]\u001b[A\u001b[A\n",
|
943 |
-
"\n",
|
944 |
-
"model-00002-of-00003.safetensors: 72%|███████▏ | 3.57G/4.98G [01:04<00:29, 47.3MB/s]\u001b[A\u001b[A\n",
|
945 |
-
"model-00001-of-00003.safetensors: 67%|██████▋ | 3.34G/4.98G [01:04<00:25, 63.2MB/s]\u001b[A\n",
|
946 |
-
"\n",
|
947 |
-
"model-00002-of-00003.safetensors: 72%|███████▏ | 3.58G/4.98G [01:04<00:27, 51.8MB/s]\u001b[A\u001b[A\n",
|
948 |
-
"\n",
|
949 |
-
"model-00002-of-00003.safetensors: 72%|███████▏ | 3.59G/4.98G [01:04<00:26, 53.2MB/s]\u001b[A\u001b[A\n",
|
950 |
-
"model-00001-of-00003.safetensors: 68%|██████▊ | 3.37G/4.98G [01:04<00:24, 66.1MB/s]\u001b[A\n",
|
951 |
-
"\n",
|
952 |
-
"model-00002-of-00003.safetensors: 72%|███████▏ | 3.60G/4.98G [01:04<00:27, 50.6MB/s]\u001b[A\u001b[A\n",
|
953 |
-
"model-00001-of-00003.safetensors: 68%|██████▊ | 3.38G/4.98G [01:04<00:26, 60.9MB/s]\u001b[A\n",
|
954 |
-
"\n",
|
955 |
-
"model-00002-of-00003.safetensors: 72%|███████▏ | 3.61G/4.98G [01:05<00:27, 50.8MB/s]\u001b[A\u001b[A\n",
|
956 |
-
"model-00001-of-00003.safetensors: 68%|██████▊ | 3.40G/4.98G [01:05<00:30, 52.4MB/s]\u001b[A\n",
|
957 |
-
"\n",
|
958 |
-
"model-00002-of-00003.safetensors: 73%|███████▎ | 3.62G/4.98G [01:05<00:32, 41.8MB/s]\u001b[A\u001b[A\n",
|
959 |
-
"model-00001-of-00003.safetensors: 68%|██████▊ | 3.41G/4.98G [01:05<00:32, 48.1MB/s]\u001b[A\n",
|
960 |
-
"\n",
|
961 |
-
"model-00002-of-00003.safetensors: 73%|███████▎ | 3.64G/4.98G [01:05<00:25, 52.3MB/s]\u001b[A\u001b[A\n",
|
962 |
-
"model-00001-of-00003.safetensors: 69%|██████▊ | 3.42G/4.98G [01:05<00:31, 50.3MB/s]\u001b[A\n",
|
963 |
-
"\n",
|
964 |
-
"model-00002-of-00003.safetensors: 73%|███████▎ | 3.65G/4.98G [01:05<00:26, 50.8MB/s]\u001b[A\u001b[A\n",
|
965 |
-
"model-00001-of-00003.safetensors: 69%|██████▉ | 3.43G/4.98G [01:06<00:36, 42.9MB/s]\u001b[A\n",
|
966 |
-
"\n",
|
967 |
-
"model-00002-of-00003.safetensors: 74%|███████▎ | 3.67G/4.98G [01:06<00:23, 55.1MB/s]\u001b[A\u001b[A\n",
|
968 |
-
"model-00001-of-00003.safetensors: 69%|██████▉ | 3.45G/4.98G [01:06<00:26, 58.5MB/s]\u001b[A\n",
|
969 |
-
"\n",
|
970 |
-
"model-00002-of-00003.safetensors: 74%|███████▍ | 3.68G/4.98G [01:06<00:26, 48.4MB/s]\u001b[A\u001b[A\n",
|
971 |
-
"model-00001-of-00003.safetensors: 69%|██████▉ | 3.46G/4.98G [01:06<00:26, 56.4MB/s]\u001b[A\n",
|
972 |
-
"model-00001-of-00003.safetensors: 70%|██████▉ | 3.47G/4.98G [01:06<00:25, 59.9MB/s]\u001b[A\n",
|
973 |
-
"\n",
|
974 |
-
"model-00002-of-00003.safetensors: 74%|███████▍ | 3.70G/4.98G [01:06<00:23, 55.0MB/s]\u001b[A\u001b[A\n",
|
975 |
-
"model-00001-of-00003.safetensors: 70%|██████▉ | 3.48G/4.98G [01:07<00:28, 52.7MB/s]\u001b[A\n",
|
976 |
-
"\n",
|
977 |
-
"model-00002-of-00003.safetensors: 74%|███████▍ | 3.71G/4.98G [01:07<00:24, 52.0MB/s]\u001b[A\u001b[A\n",
|
978 |
-
"\n",
|
979 |
-
"model-00002-of-00003.safetensors: 75%|███████▍ | 3.72G/4.98G [01:07<00:22, 55.7MB/s]\u001b[A\u001b[A\n",
|
980 |
-
"model-00001-of-00003.safetensors: 70%|███████ | 3.49G/4.98G [01:07<00:40, 36.7MB/s]\u001b[A\n",
|
981 |
-
"\n",
|
982 |
-
"model-00002-of-00003.safetensors: 75%|███████▍ | 3.73G/4.98G [01:07<00:25, 49.0MB/s]\u001b[A\u001b[A\n",
|
983 |
-
"\n",
|
984 |
-
"model-00002-of-00003.safetensors: 75%|███████▌ | 3.74G/4.98G [01:07<00:24, 51.3MB/s]\u001b[A\u001b[A\n",
|
985 |
-
"model-00001-of-00003.safetensors: 71%|███████ | 3.51G/4.98G [01:07<00:33, 43.3MB/s]\u001b[A\n",
|
986 |
-
"\n",
|
987 |
-
"model-00002-of-00003.safetensors: 75%|███████▌ | 3.75G/4.98G [01:07<00:24, 50.2MB/s]\u001b[A\u001b[A\n",
|
988 |
-
"\n",
|
989 |
-
"model-00002-of-00003.safetensors: 76%|███████▌ | 3.76G/4.98G [01:08<00:21, 55.6MB/s]\u001b[A\u001b[A\n",
|
990 |
-
"model-00001-of-00003.safetensors: 71%|███████ | 3.52G/4.98G [01:08<00:33, 44.0MB/s]\u001b[A\n",
|
991 |
-
"model-00001-of-00003.safetensors: 71%|███████ | 3.54G/4.98G [01:08<00:28, 50.8MB/s]\u001b[A\n",
|
992 |
-
"\n",
|
993 |
-
"model-00002-of-00003.safetensors: 76%|███████▌ | 3.79G/4.98G [01:08<00:23, 50.9MB/s]\u001b[A\u001b[A\n",
|
994 |
-
"\n",
|
995 |
-
"model-00002-of-00003.safetensors: 76%|███████▌ | 3.80G/4.98G [01:08<00:24, 48.8MB/s]\u001b[A\u001b[A\n",
|
996 |
-
"model-00001-of-00003.safetensors: 71%|███████▏ | 3.55G/4.98G [01:09<00:37, 38.3MB/s]\u001b[A\n",
|
997 |
-
"\n",
|
998 |
-
"model-00002-of-00003.safetensors: 77%|███████▋ | 3.82G/4.98G [01:09<00:18, 62.7MB/s]\u001b[A\u001b[A\n",
|
999 |
-
"model-00001-of-00003.safetensors: 72%|███████▏ | 3.57G/4.98G [01:09<00:32, 43.8MB/s]\u001b[A\n",
|
1000 |
-
"\n",
|
1001 |
-
"model-00002-of-00003.safetensors: 77%|███████▋ | 3.83G/4.98G [01:09<00:19, 58.1MB/s]\u001b[A\u001b[A\n",
|
1002 |
-
"model-00001-of-00003.safetensors: 72%|███████▏ | 3.58G/4.98G [01:09<00:31, 44.2MB/s]\u001b[A\n",
|
1003 |
-
"model-00001-of-00003.safetensors: 72%|███████▏ | 3.59G/4.98G [01:09<00:28, 49.5MB/s]\u001b[A\n",
|
1004 |
-
"\n",
|
1005 |
-
"model-00002-of-00003.safetensors: 77%|███████▋ | 3.85G/4.98G [01:09<00:18, 59.8MB/s]\u001b[A\u001b[A\n",
|
1006 |
-
"\n",
|
1007 |
-
"model-00002-of-00003.safetensors: 77%|███████▋ | 3.86G/4.98G [01:09<00:22, 48.9MB/s]\u001b[A\u001b[A\n",
|
1008 |
-
"model-00001-of-00003.safetensors: 72%|███████▏ | 3.61G/4.98G [01:10<00:32, 42.0MB/s]\u001b[A\n",
|
1009 |
-
"\n",
|
1010 |
-
"model-00002-of-00003.safetensors: 78%|███████▊ | 3.89G/4.98G [01:10<00:14, 73.6MB/s]\u001b[A\u001b[A\n",
|
1011 |
-
"model-00001-of-00003.safetensors: 73%|███████▎ | 3.62G/4.98G [01:10<00:34, 39.1MB/s]\u001b[A\n",
|
1012 |
-
"\n",
|
1013 |
-
"model-00002-of-00003.safetensors: 78%|███████▊ | 3.91G/4.98G [01:10<00:16, 64.8MB/s]\u001b[A\u001b[A\n",
|
1014 |
-
"\n",
|
1015 |
-
"model-00002-of-00003.safetensors: 79%|███████▊ | 3.92G/4.98G [01:10<00:17, 61.5MB/s]\u001b[A\u001b[A\n",
|
1016 |
-
"model-00001-of-00003.safetensors: 73%|███████▎ | 3.64G/4.98G [01:10<00:30, 44.2MB/s]\u001b[A\n",
|
1017 |
-
"model-00001-of-00003.safetensors: 73%|███████▎ | 3.65G/4.98G [01:11<00:30, 43.3MB/s]\u001b[A\n",
|
1018 |
-
"\n",
|
1019 |
-
"model-00002-of-00003.safetensors: 79%|███████▉ | 3.94G/4.98G [01:11<00:18, 56.2MB/s]\u001b[A\u001b[A\n",
|
1020 |
-
"\n",
|
1021 |
-
"model-00002-of-00003.safetensors: 79%|███████▉ | 3.95G/4.98G [01:11<00:18, 56.3MB/s]\u001b[A\u001b[A\n",
|
1022 |
-
"\n",
|
1023 |
-
"model-00002-of-00003.safetensors: 80%|███████▉ | 3.97G/4.98G [01:11<00:15, 64.8MB/s]\u001b[A\u001b[A\n",
|
1024 |
-
"model-00001-of-00003.safetensors: 74%|███████▎ | 3.67G/4.98G [01:11<00:32, 40.7MB/s]\u001b[A\n",
|
1025 |
-
"model-00001-of-00003.safetensors: 74%|███████▍ | 3.70G/4.98G [01:11<00:21, 60.4MB/s]\u001b[A\n",
|
1026 |
-
"model-00001-of-00003.safetensors: 75%|███████▍ | 3.71G/4.98G [01:12<00:20, 61.7MB/s]\u001b[A\n",
|
1027 |
-
"\n",
|
1028 |
-
"model-00002-of-00003.safetensors: 80%|███████▉ | 3.98G/4.98G [01:11<00:19, 50.4MB/s]\u001b[A\u001b[A\n",
|
1029 |
-
"\n",
|
1030 |
-
"model-00002-of-00003.safetensors: 80%|████████ | 4.01G/4.98G [01:12<00:18, 52.7MB/s]\u001b[A\u001b[A\n",
|
1031 |
-
"model-00001-of-00003.safetensors: 75%|███████▍ | 3.72G/4.98G [01:12<00:30, 41.2MB/s]\u001b[A\n",
|
1032 |
-
"\n",
|
1033 |
-
"model-00002-of-00003.safetensors: 81%|████████ | 4.02G/4.98G [01:12<00:19, 48.9MB/s]\u001b[A\u001b[A\n",
|
1034 |
-
"model-00001-of-00003.safetensors: 75%|███████▍ | 3.73G/4.98G [01:12<00:32, 38.7MB/s]\u001b[A\n",
|
1035 |
-
"\n",
|
1036 |
-
"model-00002-of-00003.safetensors: 81%|████████ | 4.04G/4.98G [01:13<00:18, 49.8MB/s]\u001b[A\u001b[A\n",
|
1037 |
-
"model-00001-of-00003.safetensors: 75%|███████▌ | 3.75G/4.98G [01:13<00:23, 51.9MB/s]\u001b[A\n",
|
1038 |
-
"model-00001-of-00003.safetensors: 76%|███████▌ | 3.76G/4.98G [01:13<00:22, 55.1MB/s]\u001b[A\n",
|
1039 |
-
"\n",
|
1040 |
-
"model-00002-of-00003.safetensors: 81%|████████▏ | 4.06G/4.98G [01:13<00:15, 60.3MB/s]\u001b[A\u001b[A\n",
|
1041 |
-
"\n",
|
1042 |
-
"model-00002-of-00003.safetensors: 82%|████████▏ | 4.07G/4.98G [01:13<00:17, 52.9MB/s]\u001b[A\u001b[A\n",
|
1043 |
-
"model-00001-of-00003.safetensors: 76%|███████▌ | 3.79G/4.98G [01:13<00:20, 58.7MB/s]\u001b[A\n",
|
1044 |
-
"model-00001-of-00003.safetensors: 76%|███████▌ | 3.80G/4.98G [01:13<00:21, 55.7MB/s]\u001b[A\n",
|
1045 |
-
"\n",
|
1046 |
-
"model-00002-of-00003.safetensors: 82%|████████▏ | 4.09G/4.98G [01:13<00:14, 60.8MB/s]\u001b[A\u001b[A\n",
|
1047 |
-
"model-00001-of-00003.safetensors: 76%|███████▋ | 3.81G/4.98G [01:13<00:19, 60.4MB/s]\u001b[A\n",
|
1048 |
-
"model-00001-of-00003.safetensors: 77%|███████▋ | 3.82G/4.98G [01:14<00:18, 62.2MB/s]\u001b[A\n",
|
1049 |
-
"\n",
|
1050 |
-
"model-00002-of-00003.safetensors: 82%|████████▏ | 4.10G/4.98G [01:14<00:16, 54.3MB/s]\u001b[A\u001b[A\n",
|
1051 |
-
"\n",
|
1052 |
-
"model-00002-of-00003.safetensors: 83%|████████▎ | 4.12G/4.98G [01:14<00:13, 65.5MB/s]\u001b[A\u001b[A\n",
|
1053 |
-
"model-00001-of-00003.safetensors: 77%|███████▋ | 3.83G/4.98G [01:14<00:25, 45.1MB/s]\u001b[A\n",
|
1054 |
-
"\n",
|
1055 |
-
"model-00002-of-00003.safetensors: 83%|████████▎ | 4.13G/4.98G [01:14<00:17, 49.4MB/s]\u001b[A\u001b[A\n",
|
1056 |
-
"model-00001-of-00003.safetensors: 77%|███████▋ | 3.85G/4.98G [01:14<00:22, 51.0MB/s]\u001b[A\n",
|
1057 |
-
"\n",
|
1058 |
-
"model-00002-of-00003.safetensors: 83%|████████▎ | 4.14G/4.98G [01:14<00:16, 50.5MB/s]\u001b[A\u001b[A\n",
|
1059 |
-
"model-00001-of-00003.safetensors: 77%|███████▋ | 3.86G/4.98G [01:15<00:22, 50.4MB/s]\u001b[A\n",
|
1060 |
-
"\n",
|
1061 |
-
"model-00002-of-00003.safetensors: 83%|████████▎ | 4.15G/4.98G [01:15<00:15, 52.9MB/s]\u001b[A\u001b[A\n",
|
1062 |
-
"model-00001-of-00003.safetensors: 78%|███████▊ | 3.87G/4.98G [01:15<00:24, 46.1MB/s]\u001b[A\n",
|
1063 |
-
"\n",
|
1064 |
-
"model-00002-of-00003.safetensors: 84%|████████▎ | 4.16G/4.98G [01:15<00:17, 47.3MB/s]\u001b[A\u001b[A\n",
|
1065 |
-
"model-00001-of-00003.safetensors: 78%|███████▊ | 3.88G/4.98G [01:15<00:21, 51.0MB/s]\u001b[A\n",
|
1066 |
-
"\n",
|
1067 |
-
"model-00002-of-00003.safetensors: 84%|████████▍ | 4.18G/4.98G [01:15<00:12, 66.2MB/s]\u001b[A\u001b[A\n",
|
1068 |
-
"\n",
|
1069 |
-
"model-00002-of-00003.safetensors: 84%|████████▍ | 4.19G/4.98G [01:15<00:13, 56.7MB/s]\u001b[A\u001b[A\n",
|
1070 |
-
"model-00001-of-00003.safetensors: 78%|███████▊ | 3.89G/4.98G [01:15<00:24, 44.0MB/s]\u001b[A\n",
|
1071 |
-
"\n",
|
1072 |
-
"model-00002-of-00003.safetensors: 85%|████████▍ | 4.22G/4.98G [01:15<00:10, 73.9MB/s]\u001b[A\u001b[A\n",
|
1073 |
-
"model-00001-of-00003.safetensors: 79%|███████▊ | 3.91G/4.98G [01:16<00:19, 55.8MB/s]\u001b[A\n",
|
1074 |
-
"\n",
|
1075 |
-
"model-00002-of-00003.safetensors: 85%|████████▍ | 4.23G/4.98G [01:16<00:10, 70.7MB/s]\u001b[A\u001b[A\n",
|
1076 |
-
"model-00001-of-00003.safetensors: 79%|███████▊ | 3.92G/4.98G [01:16<00:20, 52.7MB/s]\u001b[A\n",
|
1077 |
-
"model-00001-of-00003.safetensors: 79%|███████▉ | 3.93G/4.98G [01:16<00:18, 56.4MB/s]\u001b[A\n",
|
1078 |
-
"model-00001-of-00003.safetensors: 79%|███████▉ | 3.94G/4.98G [01:16<00:19, 53.4MB/s]\u001b[A\n",
|
1079 |
-
"\n",
|
1080 |
-
"model-00002-of-00003.safetensors: 85%|████████▌ | 4.25G/4.98G [01:16<00:14, 51.4MB/s]\u001b[A\u001b[A\n",
|
1081 |
-
"model-00001-of-00003.safetensors: 79%|███████▉ | 3.95G/4.98G [01:16<00:19, 52.9MB/s]\u001b[A\n",
|
1082 |
-
"\n",
|
1083 |
-
"model-00002-of-00003.safetensors: 85%|████████▌ | 4.26G/4.98G [01:16<00:15, 45.7MB/s]\u001b[A\u001b[A\n",
|
1084 |
-
"model-00001-of-00003.safetensors: 80%|███████▉ | 3.97G/4.98G [01:17<00:18, 54.1MB/s]\u001b[A\n",
|
1085 |
-
"\n",
|
1086 |
-
"model-00002-of-00003.safetensors: 86%|████████▌ | 4.28G/4.98G [01:17<00:13, 50.8MB/s]\u001b[A\u001b[A\n",
|
1087 |
-
"model-00001-of-00003.safetensors: 80%|███████▉ | 3.98G/4.98G [01:17<00:17, 55.7MB/s]\u001b[A\n",
|
1088 |
-
"\n",
|
1089 |
-
"model-00002-of-00003.safetensors: 86%|████████▌ | 4.29G/4.98G [01:17<00:14, 48.0MB/s]\u001b[A\u001b[A\n",
|
1090 |
-
"model-00001-of-00003.safetensors: 80%|████████ | 4.01G/4.98G [01:17<00:14, 67.9MB/s]\u001b[A\n",
|
1091 |
-
"model-00001-of-00003.safetensors: 81%|████████ | 4.02G/4.98G [01:17<00:14, 64.8MB/s]\u001b[A\n",
|
1092 |
-
"\n",
|
1093 |
-
"model-00002-of-00003.safetensors: 86%|████████▋ | 4.31G/4.98G [01:18<00:13, 49.0MB/s]\u001b[A\u001b[A\n",
|
1094 |
-
"\n",
|
1095 |
-
"model-00002-of-00003.safetensors: 87%|████████▋ | 4.32G/4.98G [01:18<00:13, 49.3MB/s]\u001b[A\u001b[A\n",
|
1096 |
-
"model-00001-of-00003.safetensors: 81%|████████ | 4.04G/4.98G [01:18<00:17, 53.6MB/s]\u001b[A\n",
|
1097 |
-
"\n",
|
1098 |
-
"model-00002-of-00003.safetensors: 87%|████████▋ | 4.34G/4.98G [01:18<00:12, 49.4MB/s]\u001b[A\u001b[A\n",
|
1099 |
-
"model-00001-of-00003.safetensors: 81%|████████ | 4.05G/4.98G [01:18<00:20, 45.0MB/s]\u001b[A\n",
|
1100 |
-
"model-00001-of-00003.safetensors: 81%|████████▏ | 4.06G/4.98G [01:18<00:18, 49.4MB/s]\u001b[A\n",
|
1101 |
-
"\n",
|
1102 |
-
"model-00002-of-00003.safetensors: 88%|████████▊ | 4.36G/4.98G [01:18<00:11, 54.4MB/s]\u001b[A\u001b[A\n",
|
1103 |
-
"model-00001-of-00003.safetensors: 82%|████████▏ | 4.07G/4.98G [01:19<00:20, 44.6MB/s]\u001b[A\n",
|
1104 |
-
"\n",
|
1105 |
-
"model-00002-of-00003.safetensors: 88%|████████▊ | 4.37G/4.98G [01:19<00:12, 49.8MB/s]\u001b[A\u001b[A\n",
|
1106 |
-
"\n",
|
1107 |
-
"model-00002-of-00003.safetensors: 88%|████████▊ | 4.38G/4.98G [01:19<00:11, 52.3MB/s]\u001b[A\u001b[A\n",
|
1108 |
-
"model-00001-of-00003.safetensors: 82%|████████▏ | 4.09G/4.98G [01:19<00:20, 43.2MB/s]\u001b[A\n",
|
1109 |
-
"\n",
|
1110 |
-
"model-00002-of-00003.safetensors: 88%|████████▊ | 4.39G/4.98G [01:19<00:11, 51.8MB/s]\u001b[A\u001b[A\n",
|
1111 |
-
"\n",
|
1112 |
-
"model-00002-of-00003.safetensors: 88%|████████▊ | 4.40G/4.98G [01:19<00:11, 51.5MB/s]\u001b[A\u001b[A\n",
|
1113 |
-
"\n",
|
1114 |
-
"model-00002-of-00003.safetensors: 89%|████████▉ | 4.42G/4.98G [01:19<00:08, 67.1MB/s]\u001b[A\u001b[A\n",
|
1115 |
-
"model-00001-of-00003.safetensors: 82%|████████▏ | 4.10G/4.98G [01:20<00:23, 37.3MB/s]\u001b[A\n",
|
1116 |
-
"\n",
|
1117 |
-
"model-00002-of-00003.safetensors: 89%|████████▉ | 4.44G/4.98G [01:20<00:09, 58.4MB/s]\u001b[A\u001b[A\n",
|
1118 |
-
"\n",
|
1119 |
-
"model-00002-of-00003.safetensors: 89%|████████▉ | 4.46G/4.98G [01:20<00:07, 71.1MB/s]\u001b[A\u001b[A\n",
|
1120 |
-
"model-00001-of-00003.safetensors: 83%|████████▎ | 4.12G/4.98G [01:20<00:22, 39.0MB/s]\u001b[A\n",
|
1121 |
-
"\n",
|
1122 |
-
"model-00002-of-00003.safetensors: 90%|████████▉ | 4.47G/4.98G [01:20<00:07, 68.7MB/s]\u001b[A\u001b[A\n",
|
1123 |
-
"model-00001-of-00003.safetensors: 83%|████████▎ | 4.13G/4.98G [01:20<00:19, 42.9MB/s]\u001b[A\n",
|
1124 |
-
"\n",
|
1125 |
-
"model-00002-of-00003.safetensors: 90%|████████▉ | 4.48G/4.98G [01:20<00:06, 73.3MB/s]\u001b[A\u001b[A\n",
|
1126 |
-
"\n",
|
1127 |
-
"model-00002-of-00003.safetensors: 90%|█████████ | 4.49G/4.98G [01:20<00:07, 69.2MB/s]\u001b[A\u001b[A\n",
|
1128 |
-
"model-00001-of-00003.safetensors: 83%|████████▎ | 4.15G/4.98G [01:21<00:16, 50.1MB/s]\u001b[A\n",
|
1129 |
-
"\n",
|
1130 |
-
"model-00002-of-00003.safetensors: 90%|█████████ | 4.50G/4.98G [01:21<00:08, 56.6MB/s]\u001b[A\u001b[A\n",
|
1131 |
-
"model-00001-of-00003.safetensors: 84%|████████▎ | 4.16G/4.98G [01:21<00:16, 48.6MB/s]\u001b[A\n",
|
1132 |
-
"\n",
|
1133 |
-
"model-00002-of-00003.safetensors: 91%|█████████ | 4.52G/4.98G [01:21<00:07, 62.4MB/s]\u001b[A\u001b[A\n",
|
1134 |
-
"model-00001-of-00003.safetensors: 84%|████████▍ | 4.18G/4.98G [01:21<00:15, 52.0MB/s]\u001b[A\n",
|
1135 |
-
"\n",
|
1136 |
-
"model-00002-of-00003.safetensors: 91%|█████████ | 4.53G/4.98G [01:21<00:06, 68.4MB/s]\u001b[A\u001b[A\n",
|
1137 |
-
"model-00001-of-00003.safetensors: 84%|████████▍ | 4.19G/4.98G [01:21<00:14, 54.5MB/s]\u001b[A\n",
|
1138 |
-
"\n",
|
1139 |
-
"model-00002-of-00003.safetensors: 91%|█████████▏| 4.55G/4.98G [01:21<00:06, 68.6MB/s]\u001b[A\u001b[A\n",
|
1140 |
-
"\n",
|
1141 |
-
"model-00002-of-00003.safetensors: 92%|█████████▏| 4.56G/4.98G [01:22<00:06, 69.3MB/s]\u001b[A\u001b[A\n",
|
1142 |
-
"\n",
|
1143 |
-
"model-00002-of-00003.safetensors: 92%|█████████▏| 4.57G/4.98G [01:22<00:05, 72.9MB/s]\u001b[A\u001b[A\n",
|
1144 |
-
"model-00001-of-00003.safetensors: 85%|████████▍ | 4.22G/4.98G [01:22<00:16, 46.3MB/s]\u001b[A\n",
|
1145 |
-
"\n",
|
1146 |
-
"model-00002-of-00003.safetensors: 92%|█████████▏| 4.58G/4.98G [01:22<00:06, 66.7MB/s]\u001b[A\u001b[A\n",
|
1147 |
-
"\n",
|
1148 |
-
"model-00002-of-00003.safetensors: 92%|█████████▏| 4.59G/4.98G [01:22<00:05, 69.3MB/s]\u001b[A\u001b[A\n",
|
1149 |
-
"model-00001-of-00003.safetensors: 85%|████████▍ | 4.23G/4.98G [01:22<00:17, 42.2MB/s]\u001b[A\n",
|
1150 |
-
"\n",
|
1151 |
-
"model-00002-of-00003.safetensors: 93%|█████████▎| 4.61G/4.98G [01:22<00:05, 69.2MB/s]\u001b[A\u001b[A\n",
|
1152 |
-
"model-00001-of-00003.safetensors: 85%|████████▌ | 4.25G/4.98G [01:22<00:14, 51.6MB/s]\u001b[A\n",
|
1153 |
-
"\n",
|
1154 |
-
"model-00002-of-00003.safetensors: 93%|█████████▎| 4.62G/4.98G [01:22<00:05, 67.6MB/s]\u001b[A\u001b[A\n",
|
1155 |
-
"model-00001-of-00003.safetensors: 85%|████████▌ | 4.26G/4.98G [01:23<00:14, 50.4MB/s]\u001b[A\n",
|
1156 |
-
"\n",
|
1157 |
-
"model-00002-of-00003.safetensors: 93%|█████████▎| 4.65G/4.98G [01:23<00:04, 80.9MB/s]\u001b[A\u001b[A\n",
|
1158 |
-
"model-00001-of-00003.safetensors: 86%|████████▌ | 4.28G/4.98G [01:23<00:11, 63.1MB/s]\u001b[A\n",
|
1159 |
-
"\n",
|
1160 |
-
"model-00002-of-00003.safetensors: 94%|█████████▎| 4.67G/4.98G [01:23<00:03, 86.5MB/s]\u001b[A\u001b[A\n",
|
1161 |
-
"model-00001-of-00003.safetensors: 86%|████████▌ | 4.29G/4.98G [01:23<00:12, 55.3MB/s]\u001b[A\n",
|
1162 |
-
"\n",
|
1163 |
-
"model-00002-of-00003.safetensors: 94%|█████████▍| 4.68G/4.98G [01:23<00:04, 61.9MB/s]\u001b[A\u001b[A\n",
|
1164 |
-
"model-00001-of-00003.safetensors: 86%|████████▋ | 4.31G/4.98G [01:23<00:10, 65.8MB/s]\u001b[A\n",
|
1165 |
-
"\n",
|
1166 |
-
"model-00002-of-00003.safetensors: 94%|█████████▍| 4.69G/4.98G [01:23<00:04, 61.9MB/s]\u001b[A\u001b[A\n",
|
1167 |
-
"\n",
|
1168 |
-
"model-00002-of-00003.safetensors: 94%|█████████▍| 4.70G/4.98G [01:24<00:04, 62.7MB/s]\u001b[A\u001b[A\n",
|
1169 |
-
"model-00001-of-00003.safetensors: 87%|████████▋ | 4.32G/4.98G [01:24<00:12, 54.2MB/s]\u001b[A\n",
|
1170 |
-
"model-00001-of-00003.safetensors: 87%|████████▋ | 4.34G/4.98G [01:24<00:10, 61.2MB/s]\u001b[A\n",
|
1171 |
-
"\n",
|
1172 |
-
"model-00002-of-00003.safetensors: 94%|█████████▍| 4.71G/4.98G [01:24<00:06, 43.7MB/s]\u001b[A\u001b[A\n",
|
1173 |
-
"model-00001-of-00003.safetensors: 87%|████████▋ | 4.35G/4.98G [01:24<00:10, 57.4MB/s]\u001b[A\n",
|
1174 |
-
"model-00001-of-00003.safetensors: 88%|████████▊ | 4.36G/4.98G [01:24<00:10, 61.0MB/s]\u001b[A\n",
|
1175 |
-
"\n",
|
1176 |
-
"model-00002-of-00003.safetensors: 95%|█████████▍| 4.73G/4.98G [01:24<00:05, 47.1MB/s]\u001b[A\u001b[A\n",
|
1177 |
-
"model-00001-of-00003.safetensors: 88%|████████▊ | 4.37G/4.98G [01:25<00:10, 56.1MB/s]\u001b[A\n",
|
1178 |
-
"\n",
|
1179 |
-
"model-00002-of-00003.safetensors: 95%|█████████▌| 4.74G/4.98G [01:25<00:05, 42.0MB/s]\u001b[A\u001b[A\n",
|
1180 |
-
"model-00001-of-00003.safetensors: 88%|████████▊ | 4.38G/4.98G [01:25<00:13, 44.1MB/s]\u001b[A\n",
|
1181 |
-
"\n",
|
1182 |
-
"model-00002-of-00003.safetensors: 95%|█████████▌| 4.75G/4.98G [01:25<00:05, 44.7MB/s]\u001b[A\u001b[A\n",
|
1183 |
-
"model-00001-of-00003.safetensors: 88%|████████▊ | 4.39G/4.98G [01:25<00:12, 47.3MB/s]\u001b[A\n",
|
1184 |
-
"\n",
|
1185 |
-
"model-00002-of-00003.safetensors: 96%|█████████▌| 4.76G/4.98G [01:25<00:04, 44.8MB/s]\u001b[A\u001b[A\n",
|
1186 |
-
"model-00001-of-00003.safetensors: 88%|████████▊ | 4.40G/4.98G [01:25<00:12, 45.0MB/s]\u001b[A\n",
|
1187 |
-
"\n",
|
1188 |
-
"model-00002-of-00003.safetensors: 96%|█████████▌| 4.77G/4.98G [01:25<00:04, 45.1MB/s]\u001b[A\u001b[A\n",
|
1189 |
-
"\n",
|
1190 |
-
"model-00002-of-00003.safetensors: 96%|█████████▌| 4.79G/4.98G [01:26<00:03, 58.4MB/s]\u001b[A\u001b[A\n",
|
1191 |
-
"model-00001-of-00003.safetensors: 89%|████████▉ | 4.42G/4.98G [01:26<00:12, 44.8MB/s]\u001b[A\n",
|
1192 |
-
"\n",
|
1193 |
-
"model-00002-of-00003.safetensors: 96%|█████████▋| 4.80G/4.98G [01:26<00:03, 50.2MB/s]\u001b[A\u001b[A\n",
|
1194 |
-
"model-00001-of-00003.safetensors: 89%|████████▉ | 4.44G/4.98G [01:26<00:11, 48.7MB/s]\u001b[A\n",
|
1195 |
-
"\n",
|
1196 |
-
"model-00002-of-00003.safetensors: 97%|█████████▋| 4.81G/4.98G [01:26<00:03, 55.1MB/s]\u001b[A\u001b[A\n",
|
1197 |
-
"\n",
|
1198 |
-
"model-00002-of-00003.safetensors: 97%|█████████▋| 4.82G/4.98G [01:26<00:02, 60.6MB/s]\u001b[A\u001b[A\n",
|
1199 |
-
"model-00001-of-00003.safetensors: 89%|████████▉ | 4.46G/4.98G [01:26<00:10, 50.0MB/s]\u001b[A\n",
|
1200 |
-
"\n",
|
1201 |
-
"model-00002-of-00003.safetensors: 97%|█████████▋| 4.83G/4.98G [01:26<00:02, 50.3MB/s]\u001b[A\u001b[A\n",
|
1202 |
-
"model-00001-of-00003.safetensors: 90%|████████▉ | 4.47G/4.98G [01:27<00:11, 45.4MB/s]\u001b[A\n",
|
1203 |
-
"\n",
|
1204 |
-
"model-00002-of-00003.safetensors: 97%|█████████▋| 4.85G/4.98G [01:27<00:02, 61.7MB/s]\u001b[A\u001b[A\n",
|
1205 |
-
"\n",
|
1206 |
-
"model-00002-of-00003.safetensors: 98%|█████████▊| 4.87G/4.98G [01:27<00:01, 64.6MB/s]\u001b[A\u001b[A\n",
|
1207 |
-
"model-00001-of-00003.safetensors: 90%|█████████ | 4.49G/4.98G [01:27<00:08, 56.3MB/s]\u001b[A\n",
|
1208 |
-
"\n",
|
1209 |
-
"model-00002-of-00003.safetensors: 98%|█████████▊| 4.89G/4.98G [01:27<00:01, 75.8MB/s]\u001b[A\u001b[A\n",
|
1210 |
-
"\n",
|
1211 |
-
"model-00002-of-00003.safetensors: 98%|█████████▊| 4.90G/4.98G [01:27<00:01, 65.1MB/s]\u001b[A\u001b[A\n",
|
1212 |
-
"model-00001-of-00003.safetensors: 90%|█████████ | 4.50G/4.98G [01:27<00:11, 41.5MB/s]\u001b[A\n",
|
1213 |
-
"model-00001-of-00003.safetensors: 91%|█████████ | 4.52G/4.98G [01:28<00:08, 56.4MB/s]\u001b[A\n",
|
1214 |
-
"\n",
|
1215 |
-
"model-00002-of-00003.safetensors: 99%|█████████▊| 4.92G/4.98G [01:28<00:00, 67.9MB/s]\u001b[A\u001b[A\n",
|
1216 |
-
"model-00001-of-00003.safetensors: 91%|█████████ | 4.53G/4.98G [01:28<00:07, 57.4MB/s]\u001b[A\n",
|
1217 |
-
"model-00001-of-00003.safetensors: 91%|█████████▏| 4.55G/4.98G [01:28<00:05, 72.4MB/s]\u001b[A\n",
|
1218 |
-
"\n",
|
1219 |
-
"model-00002-of-00003.safetensors: 99%|█████████▉| 4.93G/4.98G [01:28<00:00, 54.6MB/s]\u001b[A\u001b[A\n",
|
1220 |
-
"model-00001-of-00003.safetensors: 92%|█████████▏| 4.56G/4.98G [01:28<00:05, 73.0MB/s]\u001b[A\n",
|
1221 |
-
"\n",
|
1222 |
-
"model-00002-of-00003.safetensors: 99%|█████████▉| 4.95G/4.98G [01:28<00:00, 63.3MB/s]\u001b[A\u001b[A\n",
|
1223 |
-
"model-00001-of-00003.safetensors: 92%|█████████▏| 4.58G/4.98G [01:28<00:04, 80.1MB/s]\u001b[A\n",
|
1224 |
-
"\n",
|
1225 |
-
"model-00002-of-00003.safetensors: 100%|█████████▉| 4.96G/4.98G [01:28<00:00, 63.9MB/s]\u001b[A\u001b[A\n",
|
1226 |
-
"\n",
|
1227 |
-
"model-00002-of-00003.safetensors: 100%|█████████▉| 4.97G/4.98G [01:29<00:00, 59.7MB/s]\u001b[A\u001b[A\n",
|
1228 |
-
"model-00001-of-00003.safetensors: 92%|█████████▏| 4.59G/4.98G [01:29<00:06, 59.6MB/s]\u001b[A\n",
|
1229 |
-
"\n",
|
1230 |
-
"model-00002-of-00003.safetensors: 100%|██████████| 4.98G/4.98G [01:29<00:00, 55.9MB/s]\u001b[A\u001b[A\n",
|
1231 |
-
"\n",
|
1232 |
-
"model-00001-of-00003.safetensors: 93%|█████████▎| 4.61G/4.98G [01:29<00:05, 62.2MB/s]\u001b[A\n",
|
1233 |
-
"model-00001-of-00003.safetensors: 93%|█████████▎| 4.62G/4.98G [01:29<00:06, 57.7MB/s]\u001b[A\n",
|
1234 |
-
"model-00001-of-00003.safetensors: 93%|█████████▎| 4.65G/4.98G [01:29<00:05, 65.2MB/s]\u001b[A\n",
|
1235 |
-
"model-00001-of-00003.safetensors: 93%|█████████▎| 4.66G/4.98G [01:30<00:05, 64.6MB/s]\u001b[A\n",
|
1236 |
-
"model-00001-of-00003.safetensors: 94%|█████████▎| 4.67G/4.98G [01:30<00:04, 65.1MB/s]\u001b[A\n",
|
1237 |
-
"model-00001-of-00003.safetensors: 94%|█████████▍| 4.68G/4.98G [01:30<00:05, 60.3MB/s]\u001b[A\n",
|
1238 |
-
"model-00001-of-00003.safetensors: 94%|█████████▍| 4.70G/4.98G [01:30<00:04, 60.8MB/s]\u001b[A\n",
|
1239 |
-
"model-00001-of-00003.safetensors: 94%|█████████▍| 4.71G/4.98G [01:30<00:04, 62.1MB/s]\u001b[A\n",
|
1240 |
-
"model-00001-of-00003.safetensors: 95%|█████████▍| 4.73G/4.98G [01:31<00:03, 73.0MB/s]\u001b[A\n",
|
1241 |
-
"model-00001-of-00003.safetensors: 95%|█████████▌| 4.74G/4.98G [01:31<00:03, 75.3MB/s]\u001b[A\n",
|
1242 |
-
"model-00001-of-00003.safetensors: 96%|█████████▌| 4.76G/4.98G [01:31<00:02, 85.7MB/s]\u001b[A\n",
|
1243 |
-
"model-00001-of-00003.safetensors: 96%|█████████▌| 4.77G/4.98G [01:31<00:03, 60.2MB/s]\u001b[A\n",
|
1244 |
-
"model-00001-of-00003.safetensors: 96%|█████████▌| 4.78G/4.98G [01:32<00:03, 52.4MB/s]\u001b[A\n",
|
1245 |
-
"model-00001-of-00003.safetensors: 96%|█████████▌| 4.79G/4.98G [01:32<00:03, 56.1MB/s]\u001b[A\n",
|
1246 |
-
"model-00001-of-00003.safetensors: 96%|█████████▋| 4.80G/4.98G [01:32<00:04, 44.7MB/s]\u001b[A\n",
|
1247 |
-
"model-00001-of-00003.safetensors: 97%|█████████▋| 4.82G/4.98G [01:32<00:02, 58.1MB/s]\u001b[A\n",
|
1248 |
-
"model-00001-of-00003.safetensors: 97%|█████████▋| 4.83G/4.98G [01:33<00:02, 54.4MB/s]\u001b[A\n",
|
1249 |
-
"model-00001-of-00003.safetensors: 97%|█████████▋| 4.85G/4.98G [01:33<00:02, 51.5MB/s]\u001b[A\n",
|
1250 |
-
"model-00001-of-00003.safetensors: 98%|█████████▊| 4.87G/4.98G [01:33<00:02, 44.7MB/s]\u001b[A\n",
|
1251 |
-
"model-00001-of-00003.safetensors: 98%|█████████▊| 4.88G/4.98G [01:34<00:02, 45.1MB/s]\u001b[A\n",
|
1252 |
-
"model-00001-of-00003.safetensors: 98%|█████████▊| 4.89G/4.98G [01:34<00:01, 52.4MB/s]\u001b[A\n",
|
1253 |
-
"model-00001-of-00003.safetensors: 98%|█████████▊| 4.90G/4.98G [01:34<00:01, 55.3MB/s]\u001b[A\n",
|
1254 |
-
"model-00001-of-00003.safetensors: 98%|█████████▊| 4.91G/4.98G [01:34<00:01, 57.0MB/s]\u001b[A\n",
|
1255 |
-
"model-00001-of-00003.safetensors: 99%|█████████▊| 4.92G/4.98G [01:34<00:01, 57.2MB/s]\u001b[A\n",
|
1256 |
-
"model-00001-of-00003.safetensors: 99%|█████████▉| 4.93G/4.98G [01:34<00:00, 57.8MB/s]\u001b[A\n",
|
1257 |
-
"model-00001-of-00003.safetensors: 99%|█████████▉| 4.95G/4.98G [01:35<00:00, 67.6MB/s]\u001b[A\n",
|
1258 |
-
"model-00001-of-00003.safetensors: 100%|█████████▉| 4.96G/4.98G [01:35<00:00, 69.8MB/s]\u001b[A\n",
|
1259 |
-
"model-00001-of-00003.safetensors: 100%|█████████▉| 4.97G/4.98G [01:35<00:00, 64.0MB/s]\u001b[A\n",
|
1260 |
-
"model-00001-of-00003.safetensors: 100%|██████████| 4.98G/4.98G [01:35<00:00, 52.0MB/s]\u001b[A\n"
|
1261 |
]
|
1262 |
},
|
1263 |
{
|
1264 |
"ename": "KeyError",
|
1265 |
-
"evalue": "'base_model.model.
|
1266 |
"output_type": "error",
|
1267 |
"traceback": [
|
1268 |
"\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
|
1269 |
"\u001b[0;31mKeyError\u001b[0m Traceback (most recent call last)",
|
1270 |
-
"Cell \u001b[0;32mIn[
|
1271 |
"File \u001b[0;32m/usr/local/lib/python3.11/site-packages/vllm/entrypoints/llm.py:109\u001b[0m, in \u001b[0;36mLLM.__init__\u001b[0;34m(self, model, tokenizer, tokenizer_mode, trust_remote_code, tensor_parallel_size, dtype, quantization, revision, tokenizer_revision, seed, gpu_memory_utilization, swap_space, enforce_eager, max_context_len_to_capture, disable_custom_all_reduce, **kwargs)\u001b[0m\n\u001b[1;32m 90\u001b[0m kwargs[\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mdisable_log_stats\u001b[39m\u001b[38;5;124m\"\u001b[39m] \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;01mTrue\u001b[39;00m\n\u001b[1;32m 91\u001b[0m engine_args \u001b[38;5;241m=\u001b[39m EngineArgs(\n\u001b[1;32m 92\u001b[0m model\u001b[38;5;241m=\u001b[39mmodel,\n\u001b[1;32m 93\u001b[0m tokenizer\u001b[38;5;241m=\u001b[39mtokenizer,\n\u001b[0;32m (...)\u001b[0m\n\u001b[1;32m 107\u001b[0m \u001b[38;5;241m*\u001b[39m\u001b[38;5;241m*\u001b[39mkwargs,\n\u001b[1;32m 108\u001b[0m )\n\u001b[0;32m--> 109\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mllm_engine \u001b[38;5;241m=\u001b[39m \u001b[43mLLMEngine\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mfrom_engine_args\u001b[49m\u001b[43m(\u001b[49m\u001b[43mengine_args\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 110\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mrequest_counter \u001b[38;5;241m=\u001b[39m Counter()\n",
|
1272 |
"File \u001b[0;32m/usr/local/lib/python3.11/site-packages/vllm/engine/llm_engine.py:356\u001b[0m, in \u001b[0;36mLLMEngine.from_engine_args\u001b[0;34m(cls, engine_args)\u001b[0m\n\u001b[1;32m 354\u001b[0m placement_group \u001b[38;5;241m=\u001b[39m initialize_cluster(parallel_config)\n\u001b[1;32m 355\u001b[0m \u001b[38;5;66;03m# Create the LLM engine.\u001b[39;00m\n\u001b[0;32m--> 356\u001b[0m engine \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;43mcls\u001b[39;49m\u001b[43m(\u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43mengine_configs\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 357\u001b[0m \u001b[43m \u001b[49m\u001b[43mplacement_group\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 358\u001b[0m \u001b[43m \u001b[49m\u001b[43mlog_stats\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[38;5;129;43;01mnot\u001b[39;49;00m\u001b[43m \u001b[49m\u001b[43mengine_args\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mdisable_log_stats\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 359\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m engine\n",
|
1273 |
"File \u001b[0;32m/usr/local/lib/python3.11/site-packages/vllm/engine/llm_engine.py:111\u001b[0m, in \u001b[0;36mLLMEngine.__init__\u001b[0;34m(self, model_config, cache_config, parallel_config, scheduler_config, lora_config, placement_group, log_stats)\u001b[0m\n\u001b[1;32m 109\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_init_workers_ray(placement_group)\n\u001b[1;32m 110\u001b[0m \u001b[38;5;28;01melse\u001b[39;00m:\n\u001b[0;32m--> 111\u001b[0m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43m_init_workers\u001b[49m\u001b[43m(\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 113\u001b[0m \u001b[38;5;66;03m# Profile the memory usage and initialize the cache.\u001b[39;00m\n\u001b[1;32m 114\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_init_cache()\n",
|
@@ -1276,8 +283,8 @@
|
|
1276 |
"File \u001b[0;32m/usr/local/lib/python3.11/site-packages/vllm/worker/worker.py:92\u001b[0m, in \u001b[0;36mWorker.load_model\u001b[0;34m(self)\u001b[0m\n\u001b[1;32m 91\u001b[0m \u001b[38;5;28;01mdef\u001b[39;00m \u001b[38;5;21mload_model\u001b[39m(\u001b[38;5;28mself\u001b[39m):\n\u001b[0;32m---> 92\u001b[0m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mmodel_runner\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mload_model\u001b[49m\u001b[43m(\u001b[49m\u001b[43m)\u001b[49m\n",
|
1277 |
"File \u001b[0;32m/usr/local/lib/python3.11/site-packages/vllm/worker/model_runner.py:75\u001b[0m, in \u001b[0;36mModelRunner.load_model\u001b[0;34m(self)\u001b[0m\n\u001b[1;32m 74\u001b[0m \u001b[38;5;28;01mdef\u001b[39;00m \u001b[38;5;21mload_model\u001b[39m(\u001b[38;5;28mself\u001b[39m) \u001b[38;5;241m-\u001b[39m\u001b[38;5;241m>\u001b[39m \u001b[38;5;28;01mNone\u001b[39;00m:\n\u001b[0;32m---> 75\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mmodel \u001b[38;5;241m=\u001b[39m \u001b[43mget_model\u001b[49m\u001b[43m(\u001b[49m\u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mmodel_config\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mlora_config\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 77\u001b[0m vocab_size \u001b[38;5;241m=\u001b[39m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mmodel\u001b[38;5;241m.\u001b[39mconfig\u001b[38;5;241m.\u001b[39mvocab_size\n\u001b[1;32m 79\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mlora_config:\n",
|
1278 |
"File \u001b[0;32m/usr/local/lib/python3.11/site-packages/vllm/model_executor/model_loader.py:88\u001b[0m, in \u001b[0;36mget_model\u001b[0;34m(model_config, lora_config)\u001b[0m\n\u001b[1;32m 85\u001b[0m initialize_dummy_weights(model)\n\u001b[1;32m 86\u001b[0m \u001b[38;5;28;01melse\u001b[39;00m:\n\u001b[1;32m 87\u001b[0m \u001b[38;5;66;03m# Load the weights from the cached or downloaded files.\u001b[39;00m\n\u001b[0;32m---> 88\u001b[0m \u001b[43mmodel\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mload_weights\u001b[49m\u001b[43m(\u001b[49m\u001b[43mmodel_config\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mmodel\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mmodel_config\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mdownload_dir\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 89\u001b[0m \u001b[43m \u001b[49m\u001b[43mmodel_config\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mload_format\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mmodel_config\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mrevision\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 90\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m model\u001b[38;5;241m.\u001b[39meval()\n",
|
1279 |
-
"File \u001b[0;32m/usr/local/lib/python3.11/site-packages/vllm/model_executor/models/phi.py:
|
1280 |
-
"\u001b[0;31mKeyError\u001b[0m: 'base_model.model.
|
1281 |
]
|
1282 |
}
|
1283 |
],
|
|
|
225 |
},
|
226 |
{
|
227 |
"cell_type": "code",
|
228 |
+
"execution_count": 5,
|
229 |
"id": "75a61ec8-e440-42b0-8b4d-e3cb05841b71",
|
230 |
"metadata": {},
|
231 |
+
"outputs": [],
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
232 |
"source": [
|
233 |
"import torch\n",
|
234 |
"import numpy as np\n",
|
|
|
240 |
},
|
241 |
{
|
242 |
"cell_type": "code",
|
243 |
+
"execution_count": 7,
|
244 |
"id": "7d29ba48-d4b0-4f24-8f88-560d9bed100c",
|
245 |
"metadata": {
|
246 |
"scrolled": true
|
247 |
},
|
248 |
"outputs": [
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
249 |
{
|
250 |
"name": "stdout",
|
251 |
"output_type": "stream",
|
252 |
"text": [
|
253 |
+
"INFO 02-15 18:03:33 llm_engine.py:72] Initializing an LLM engine with config: model='aissatoubalde/lab', tokenizer='microsoft/phi-2', tokenizer_mode=auto, revision=None, tokenizer_revision=None, trust_remote_code=False, dtype=torch.float16, max_seq_len=2048, download_dir=None, load_format=auto, tensor_parallel_size=1, disable_custom_all_reduce=False, quantization=None, enforce_eager=False, kv_cache_dtype=auto, seed=0)\n"
|
254 |
]
|
255 |
},
|
256 |
{
|
257 |
"name": "stderr",
|
258 |
"output_type": "stream",
|
259 |
"text": [
|
|
|
260 |
"Special tokens have been added in the vocabulary, make sure the associated word embeddings are fine-tuned or trained.\n"
|
261 |
]
|
262 |
},
|
|
|
264 |
"name": "stdout",
|
265 |
"output_type": "stream",
|
266 |
"text": [
|
267 |
+
"INFO 02-15 18:03:33 weight_utils.py:164] Using model weights format ['*.safetensors']\n"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
268 |
]
|
269 |
},
|
270 |
{
|
271 |
"ename": "KeyError",
|
272 |
+
"evalue": "'base_model.model.model.layers.0.mlp.fc1.lora_A.weight'",
|
273 |
"output_type": "error",
|
274 |
"traceback": [
|
275 |
"\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
|
276 |
"\u001b[0;31mKeyError\u001b[0m Traceback (most recent call last)",
|
277 |
+
"Cell \u001b[0;32mIn[7], line 4\u001b[0m\n\u001b[1;32m 2\u001b[0m base_model_name\u001b[38;5;241m=\u001b[39m\u001b[38;5;124m'\u001b[39m\u001b[38;5;124mmicrosoft/phi-2\u001b[39m\u001b[38;5;124m'\u001b[39m\n\u001b[1;32m 3\u001b[0m merged_peft_model_name\u001b[38;5;241m=\u001b[39m\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124maissatoubalde/lab\u001b[39m\u001b[38;5;124m\"\u001b[39m\n\u001b[0;32m----> 4\u001b[0m llm \u001b[38;5;241m=\u001b[39m \u001b[43mLLM\u001b[49m\u001b[43m(\u001b[49m\u001b[43mmodel\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mmerged_peft_model_name\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mtokenizer\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mbase_model_name\u001b[49m\u001b[43m)\u001b[49m\n",
|
278 |
"File \u001b[0;32m/usr/local/lib/python3.11/site-packages/vllm/entrypoints/llm.py:109\u001b[0m, in \u001b[0;36mLLM.__init__\u001b[0;34m(self, model, tokenizer, tokenizer_mode, trust_remote_code, tensor_parallel_size, dtype, quantization, revision, tokenizer_revision, seed, gpu_memory_utilization, swap_space, enforce_eager, max_context_len_to_capture, disable_custom_all_reduce, **kwargs)\u001b[0m\n\u001b[1;32m 90\u001b[0m kwargs[\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mdisable_log_stats\u001b[39m\u001b[38;5;124m\"\u001b[39m] \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;01mTrue\u001b[39;00m\n\u001b[1;32m 91\u001b[0m engine_args \u001b[38;5;241m=\u001b[39m EngineArgs(\n\u001b[1;32m 92\u001b[0m model\u001b[38;5;241m=\u001b[39mmodel,\n\u001b[1;32m 93\u001b[0m tokenizer\u001b[38;5;241m=\u001b[39mtokenizer,\n\u001b[0;32m (...)\u001b[0m\n\u001b[1;32m 107\u001b[0m \u001b[38;5;241m*\u001b[39m\u001b[38;5;241m*\u001b[39mkwargs,\n\u001b[1;32m 108\u001b[0m )\n\u001b[0;32m--> 109\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mllm_engine \u001b[38;5;241m=\u001b[39m \u001b[43mLLMEngine\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mfrom_engine_args\u001b[49m\u001b[43m(\u001b[49m\u001b[43mengine_args\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 110\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mrequest_counter \u001b[38;5;241m=\u001b[39m Counter()\n",
|
279 |
"File \u001b[0;32m/usr/local/lib/python3.11/site-packages/vllm/engine/llm_engine.py:356\u001b[0m, in \u001b[0;36mLLMEngine.from_engine_args\u001b[0;34m(cls, engine_args)\u001b[0m\n\u001b[1;32m 354\u001b[0m placement_group \u001b[38;5;241m=\u001b[39m initialize_cluster(parallel_config)\n\u001b[1;32m 355\u001b[0m \u001b[38;5;66;03m# Create the LLM engine.\u001b[39;00m\n\u001b[0;32m--> 356\u001b[0m engine \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;43mcls\u001b[39;49m\u001b[43m(\u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43mengine_configs\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 357\u001b[0m \u001b[43m \u001b[49m\u001b[43mplacement_group\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 358\u001b[0m \u001b[43m \u001b[49m\u001b[43mlog_stats\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[38;5;129;43;01mnot\u001b[39;49;00m\u001b[43m \u001b[49m\u001b[43mengine_args\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mdisable_log_stats\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 359\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m engine\n",
|
280 |
"File \u001b[0;32m/usr/local/lib/python3.11/site-packages/vllm/engine/llm_engine.py:111\u001b[0m, in \u001b[0;36mLLMEngine.__init__\u001b[0;34m(self, model_config, cache_config, parallel_config, scheduler_config, lora_config, placement_group, log_stats)\u001b[0m\n\u001b[1;32m 109\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_init_workers_ray(placement_group)\n\u001b[1;32m 110\u001b[0m \u001b[38;5;28;01melse\u001b[39;00m:\n\u001b[0;32m--> 111\u001b[0m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43m_init_workers\u001b[49m\u001b[43m(\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 113\u001b[0m \u001b[38;5;66;03m# Profile the memory usage and initialize the cache.\u001b[39;00m\n\u001b[1;32m 114\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_init_cache()\n",
|
|
|
283 |
"File \u001b[0;32m/usr/local/lib/python3.11/site-packages/vllm/worker/worker.py:92\u001b[0m, in \u001b[0;36mWorker.load_model\u001b[0;34m(self)\u001b[0m\n\u001b[1;32m 91\u001b[0m \u001b[38;5;28;01mdef\u001b[39;00m \u001b[38;5;21mload_model\u001b[39m(\u001b[38;5;28mself\u001b[39m):\n\u001b[0;32m---> 92\u001b[0m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mmodel_runner\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mload_model\u001b[49m\u001b[43m(\u001b[49m\u001b[43m)\u001b[49m\n",
|
284 |
"File \u001b[0;32m/usr/local/lib/python3.11/site-packages/vllm/worker/model_runner.py:75\u001b[0m, in \u001b[0;36mModelRunner.load_model\u001b[0;34m(self)\u001b[0m\n\u001b[1;32m 74\u001b[0m \u001b[38;5;28;01mdef\u001b[39;00m \u001b[38;5;21mload_model\u001b[39m(\u001b[38;5;28mself\u001b[39m) \u001b[38;5;241m-\u001b[39m\u001b[38;5;241m>\u001b[39m \u001b[38;5;28;01mNone\u001b[39;00m:\n\u001b[0;32m---> 75\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mmodel \u001b[38;5;241m=\u001b[39m \u001b[43mget_model\u001b[49m\u001b[43m(\u001b[49m\u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mmodel_config\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mlora_config\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 77\u001b[0m vocab_size \u001b[38;5;241m=\u001b[39m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mmodel\u001b[38;5;241m.\u001b[39mconfig\u001b[38;5;241m.\u001b[39mvocab_size\n\u001b[1;32m 79\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mlora_config:\n",
|
285 |
"File \u001b[0;32m/usr/local/lib/python3.11/site-packages/vllm/model_executor/model_loader.py:88\u001b[0m, in \u001b[0;36mget_model\u001b[0;34m(model_config, lora_config)\u001b[0m\n\u001b[1;32m 85\u001b[0m initialize_dummy_weights(model)\n\u001b[1;32m 86\u001b[0m \u001b[38;5;28;01melse\u001b[39;00m:\n\u001b[1;32m 87\u001b[0m \u001b[38;5;66;03m# Load the weights from the cached or downloaded files.\u001b[39;00m\n\u001b[0;32m---> 88\u001b[0m \u001b[43mmodel\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mload_weights\u001b[49m\u001b[43m(\u001b[49m\u001b[43mmodel_config\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mmodel\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mmodel_config\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mdownload_dir\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 89\u001b[0m \u001b[43m \u001b[49m\u001b[43mmodel_config\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mload_format\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mmodel_config\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mrevision\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 90\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m model\u001b[38;5;241m.\u001b[39meval()\n",
|
286 |
+
"File \u001b[0;32m/usr/local/lib/python3.11/site-packages/vllm/model_executor/models/phi.py:302\u001b[0m, in \u001b[0;36mPhiForCausalLM.load_weights\u001b[0;34m(self, model_name_or_path, cache_dir, load_format, revision)\u001b[0m\n\u001b[1;32m 299\u001b[0m \u001b[38;5;28;01mcontinue\u001b[39;00m\n\u001b[1;32m 300\u001b[0m \u001b[38;5;66;03m# pylint: disable=E1136\u001b[39;00m\n\u001b[0;32m--> 302\u001b[0m param \u001b[38;5;241m=\u001b[39m \u001b[43mparams_dict\u001b[49m\u001b[43m[\u001b[49m\u001b[43mname\u001b[49m\u001b[43m]\u001b[49m\n\u001b[1;32m 303\u001b[0m weight_loader \u001b[38;5;241m=\u001b[39m \u001b[38;5;28mgetattr\u001b[39m(param, \u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mweight_loader\u001b[39m\u001b[38;5;124m\"\u001b[39m,\n\u001b[1;32m 304\u001b[0m default_weight_loader)\n\u001b[1;32m 305\u001b[0m weight_loader(param, loaded_weight)\n",
|
287 |
+
"\u001b[0;31mKeyError\u001b[0m: 'base_model.model.model.layers.0.mlp.fc1.lora_A.weight'"
|
288 |
]
|
289 |
}
|
290 |
],
|
phi-2-custom.ipynb
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4664
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4b6c071b2811955d6107874169c939219fa3eadea899cc5d22b1dfc67183f694
|
3 |
size 4664
|