aissatoubalde commited on
Commit
fe490e0
1 Parent(s): cc55646

Training in progress, epoch 0

Browse files
.ipynb_checkpoints/phi-2-custom-checkpoint.ipynb CHANGED
The diff for this file is too large to render. See raw diff
 
adapter_config.json CHANGED
@@ -18,6 +18,12 @@
18
  "r": 16,
19
  "rank_pattern": {},
20
  "revision": null,
 
 
 
 
 
 
21
  "task_type": "CAUSAL_LM",
22
  "use_rslora": false
23
  }
 
18
  "r": 16,
19
  "rank_pattern": {},
20
  "revision": null,
21
+ "target_modules": [
22
+ "fc2",
23
+ "fc1",
24
+ "v_proj",
25
+ "q_proj"
26
+ ],
27
  "task_type": "CAUSAL_LM",
28
  "use_rslora": false
29
  }
fine-tuned-phi2.ipynb CHANGED
@@ -225,20 +225,10 @@
225
  },
226
  {
227
  "cell_type": "code",
228
- "execution_count": 3,
229
  "id": "75a61ec8-e440-42b0-8b4d-e3cb05841b71",
230
  "metadata": {},
231
- "outputs": [
232
- {
233
- "name": "stderr",
234
- "output_type": "stream",
235
- "text": [
236
- "/usr/local/lib/python3.11/site-packages/tqdm/auto.py:21: TqdmWarning: IProgress not found. Please update jupyter and ipywidgets. See https://ipywidgets.readthedocs.io/en/stable/user_install.html\n",
237
- " from .autonotebook import tqdm as notebook_tqdm\n",
238
- "2024-02-15 17:38:51,139\tINFO util.py:154 -- Missing packages: ['ipywidgets']. Run `pip install -U ipywidgets`, then restart the notebook server for rich notebook output.\n"
239
- ]
240
- }
241
- ],
242
  "source": [
243
  "import torch\n",
244
  "import numpy as np\n",
@@ -250,31 +240,23 @@
250
  },
251
  {
252
  "cell_type": "code",
253
- "execution_count": 4,
254
  "id": "7d29ba48-d4b0-4f24-8f88-560d9bed100c",
255
  "metadata": {
256
  "scrolled": true
257
  },
258
  "outputs": [
259
- {
260
- "name": "stderr",
261
- "output_type": "stream",
262
- "text": [
263
- "config.json: 100%|██████████| 897/897 [00:00<00:00, 6.40MB/s]"
264
- ]
265
- },
266
  {
267
  "name": "stdout",
268
  "output_type": "stream",
269
  "text": [
270
- "INFO 02-15 17:39:03 llm_engine.py:72] Initializing an LLM engine with config: model='aissatoubalde/lab', tokenizer='microsoft/phi-2', tokenizer_mode=auto, revision=None, tokenizer_revision=None, trust_remote_code=False, dtype=torch.float16, max_seq_len=2048, download_dir=None, load_format=auto, tensor_parallel_size=1, disable_custom_all_reduce=False, quantization=None, enforce_eager=False, kv_cache_dtype=auto, seed=0)\n"
271
  ]
272
  },
273
  {
274
  "name": "stderr",
275
  "output_type": "stream",
276
  "text": [
277
- "\n",
278
  "Special tokens have been added in the vocabulary, make sure the associated word embeddings are fine-tuned or trained.\n"
279
  ]
280
  },
@@ -282,992 +264,17 @@
282
  "name": "stdout",
283
  "output_type": "stream",
284
  "text": [
285
- "INFO 02-15 17:39:05 weight_utils.py:164] Using model weights format ['*.safetensors']\n"
286
- ]
287
- },
288
- {
289
- "name": "stderr",
290
- "output_type": "stream",
291
- "text": [
292
- "model-00003-of-00003.safetensors: 0%| | 0.00/1.15G [00:00<?, ?B/s]\n",
293
- "model-00001-of-00003.safetensors: 0%| | 0.00/4.98G [00:00<?, ?B/s]\u001b[A\n",
294
- "\n",
295
- "model-00003-of-00003.safetensors: 2%|▏ | 21.0M/1.15G [00:00<00:13, 82.8MB/s]\n",
296
- "model-00001-of-00003.safetensors: 0%| | 21.0M/4.98G [00:00<01:01, 80.2MB/s]\u001b[A\n",
297
- "\n",
298
- "model-00003-of-00003.safetensors: 4%|▎ | 41.9M/1.15G [00:00<00:09, 112MB/s] \u001b[A\u001b[A\n",
299
- "\n",
300
- "model-00002-of-00003.safetensors: 1%| | 31.5M/4.98G [00:00<00:56, 87.1MB/s]\u001b[A\u001b[A\n",
301
- "model-00001-of-00003.safetensors: 1%| | 41.9M/4.98G [00:00<00:55, 89.8MB/s]\u001b[A\n",
302
- "\n",
303
- "model-00002-of-00003.safetensors: 1%| | 41.9M/4.98G [00:00<01:03, 78.0MB/s]\u001b[A\u001b[A\n",
304
- "\n",
305
- "model-00002-of-00003.safetensors: 1%| | 52.4M/4.98G [00:00<00:59, 82.3MB/s]\u001b[A\u001b[A\n",
306
- "model-00001-of-00003.safetensors: 1%| | 52.4M/4.98G [00:00<01:24, 58.1MB/s]\u001b[A\n",
307
- "\n",
308
- "model-00002-of-00003.safetensors: 1%|▏ | 73.4M/4.98G [00:00<00:59, 82.0MB/s]\u001b[A\u001b[A\n",
309
- "model-00001-of-00003.safetensors: 1%|▏ | 73.4M/4.98G [00:01<01:16, 64.0MB/s]\u001b[A\n",
310
- "\n",
311
- "model-00003-of-00003.safetensors: 5%|▌ | 62.9M/1.15G [00:01<00:25, 43.0MB/s]\u001b[A\u001b[A\n",
312
- "model-00001-of-00003.safetensors: 2%|▏ | 83.9M/4.98G [00:01<01:22, 59.1MB/s]\u001b[A\n",
313
- "\n",
314
- "model-00003-of-00003.safetensors: 6%|▋ | 73.4M/1.15G [00:01<00:23, 46.8MB/s]\u001b[A\u001b[A\n",
315
- "model-00001-of-00003.safetensors: 2%|▏ | 94.4M/4.98G [00:01<01:19, 61.3MB/s]\u001b[A\n",
316
- "\n",
317
- "model-00002-of-00003.safetensors: 2%|▏ | 115M/4.98G [00:01<01:00, 79.9MB/s]\u001b[A\u001b[A\n",
318
- "model-00001-of-00003.safetensors: 2%|▏ | 105M/4.98G [00:01<01:21, 60.1MB/s] \u001b[A\n",
319
- "\n",
320
- "model-00002-of-00003.safetensors: 3%|▎ | 136M/4.98G [00:01<01:06, 72.9MB/s]\u001b[A\u001b[A\n",
321
- "model-00003-of-00003.safetensors: 7%|▋ | 83.9M/1.15G [00:01<00:29, 35.7MB/s][A\n",
322
- "\n",
323
- "model-00002-of-00003.safetensors: 3%|▎ | 147M/4.98G [00:01<01:09, 69.6MB/s]\u001b[A\u001b[A\n",
324
- "model-00001-of-00003.safetensors: 3%|▎ | 136M/4.98G [00:02<01:18, 61.6MB/s]\u001b[A\n",
325
- "\n",
326
- "model-00003-of-00003.safetensors: 8%|▊ | 94.4M/1.15G [00:02<00:35, 29.9MB/s][A\u001b[A\n",
327
- "model-00003-of-00003.safetensors: 9%|▉ | 105M/1.15G [00:02<00:29, 35.8MB/s] [A\n",
328
- "\n",
329
- "model-00003-of-00003.safetensors: 10%|▉ | 115M/1.15G [00:02<00:25, 41.5MB/s]\u001b[A\u001b[A\n",
330
- "model-00001-of-00003.safetensors: 3%|▎ | 168M/4.98G [00:02<01:18, 61.4MB/s]\u001b[A\n",
331
- "\n",
332
- "model-00002-of-00003.safetensors: 4%|▍ | 199M/4.98G [00:02<01:12, 65.8MB/s]\u001b[A\u001b[A\n",
333
- "model-00001-of-00003.safetensors: 4%|▎ | 178M/4.98G [00:02<01:19, 60.5MB/s]\u001b[A\n",
334
- "\n",
335
- "model-00002-of-00003.safetensors: 4%|▍ | 210M/4.98G [00:02<01:09, 68.7MB/s]\u001b[A\u001b[A\n",
336
- "model-00001-of-00003.safetensors: 4%|▍ | 199M/4.98G [00:03<01:11, 67.0MB/s]\u001b[A\n",
337
- "\n",
338
- "model-00002-of-00003.safetensors: 5%|▍ | 231M/4.98G [00:03<01:00, 78.9MB/s]\u001b[A\u001b[A\n",
339
- "\n",
340
- "model-00003-of-00003.safetensors: 12%|█▏ | 136M/1.15G [00:03<00:27, 37.0MB/s]\u001b[A\u001b[A\n",
341
- "model-00003-of-00003.safetensors: 13%|█▎ | 147M/1.15G [00:03<00:26, 37.7MB/s]\u001b[A\n",
342
- "model-00003-of-00003.safetensors: 15%|█▍ | 168M/1.15G [00:03<00:19, 51.6MB/s]\u001b[A\n",
343
- "\n",
344
- "model-00002-of-00003.safetensors: 5%|▌ | 262M/4.98G [00:03<01:26, 54.9MB/s]\u001b[A\u001b[A\n",
345
- "model-00001-of-00003.safetensors: 5%|▍ | 231M/4.98G [00:03<01:41, 46.6MB/s]\u001b[A\n",
346
- "\n",
347
- "model-00002-of-00003.safetensors: 5%|▌ | 273M/4.98G [00:04<01:28, 53.1MB/s]\u001b[A\u001b[A\n",
348
- "model-00003-of-00003.safetensors: 15%|█▌ | 178M/1.15G [00:04<00:24, 39.3MB/s]\u001b[A\n",
349
- "\n",
350
- "model-00002-of-00003.safetensors: 6%|▌ | 294M/4.98G [00:04<01:18, 59.7MB/s]\u001b[A\u001b[A\n",
351
- "model-00003-of-00003.safetensors: 17%|█▋ | 199M/1.15G [00:04<00:18, 53.0MB/s]\u001b[A\n",
352
- "\n",
353
- "model-00002-of-00003.safetensors: 6%|▌ | 304M/4.98G [00:04<01:21, 57.5MB/s]\u001b[A\u001b[A\n",
354
- "model-00003-of-00003.safetensors: 18%|█▊ | 210M/1.15G [00:04<00:22, 42.1MB/s]\u001b[A\n",
355
- "\n",
356
- "model-00003-of-00003.safetensors: 19%|█▉ | 220M/1.15G [00:05<00:19, 47.1MB/s]\u001b[A\u001b[A\n",
357
- "\n",
358
- "model-00002-of-00003.safetensors: 7%|▋ | 336M/4.98G [00:05<01:19, 58.4MB/s]\u001b[A\u001b[A\n",
359
- "model-00001-of-00003.safetensors: 6%|▌ | 294M/4.98G [00:05<01:36, 48.7MB/s]\u001b[A\n",
360
- "\n",
361
- "model-00003-of-00003.safetensors: 21%|██ | 241M/1.15G [00:05<00:20, 43.7MB/s]\u001b[A\u001b[A\n",
362
- "model-00001-of-00003.safetensors: 6%|▌ | 304M/4.98G [00:05<01:51, 42.0MB/s]\u001b[A\n",
363
- "\n",
364
- "model-00002-of-00003.safetensors: 7%|▋ | 357M/4.98G [00:05<01:32, 49.8MB/s]\u001b[A\u001b[A\n",
365
- "model-00001-of-00003.safetensors: 6%|▋ | 315M/4.98G [00:05<01:42, 45.4MB/s]\u001b[A\n",
366
- "\n",
367
- "model-00003-of-00003.safetensors: 22%|██▏ | 252M/1.15G [00:05<00:21, 41.3MB/s]\u001b[A\u001b[A\n",
368
- "\n",
369
- "model-00003-of-00003.safetensors: 23%|██▎ | 262M/1.15G [00:05<00:18, 48.4MB/s]\u001b[A\u001b[A\n",
370
- "\n",
371
- "model-00002-of-00003.safetensors: 8%|▊ | 388M/4.98G [00:06<01:23, 55.1MB/s]\u001b[A\u001b[A\n",
372
- "model-00003-of-00003.safetensors: 24%|██▎ | 273M/1.15G [00:06<00:18, 48.6MB/s]\u001b[A\n",
373
- "model-00003-of-00003.safetensors: 25%|██▌ | 294M/1.15G [00:06<00:14, 61.2MB/s]\u001b[A\n",
374
- "model-00001-of-00003.safetensors: 7%|▋ | 346M/4.98G [00:06<01:34, 48.9MB/s]\u001b[A\n",
375
- "\n",
376
- "model-00002-of-00003.safetensors: 8%|▊ | 409M/4.98G [00:06<01:17, 58.7MB/s]\u001b[A\u001b[A\n",
377
- "\n",
378
- "model-00002-of-00003.safetensors: 8%|▊ | 419M/4.98G [00:06<01:12, 63.3MB/s]\u001b[A\u001b[A\n",
379
- "model-00003-of-00003.safetensors: 29%|██▉ | 336M/1.15G [00:06<00:09, 83.7MB/s]\u001b[A\n",
380
- "\n",
381
- "model-00002-of-00003.safetensors: 9%|▉ | 440M/4.98G [00:06<01:01, 73.6MB/s]\u001b[A\u001b[A\n",
382
- "model-00001-of-00003.safetensors: 8%|▊ | 377M/4.98G [00:06<01:16, 60.6MB/s]\u001b[A\n",
383
- "\n",
384
- "model-00003-of-00003.safetensors: 30%|██▉ | 346M/1.15G [00:06<00:10, 76.1MB/s]\u001b[A\u001b[A\n",
385
- "model-00001-of-00003.safetensors: 8%|▊ | 388M/4.98G [00:07<01:18, 58.2MB/s]\u001b[A\n",
386
- "\n",
387
- "model-00003-of-00003.safetensors: 31%|███ | 357M/1.15G [00:07<00:14, 53.4MB/s]\u001b[A\u001b[A\n",
388
- "model-00001-of-00003.safetensors: 8%|▊ | 398M/4.98G [00:07<01:27, 52.6MB/s]\u001b[A\n",
389
- "\n",
390
- "model-00002-of-00003.safetensors: 10%|▉ | 482M/4.98G [00:07<01:14, 60.6MB/s]\u001b[A\u001b[A\n",
391
- "model-00003-of-00003.safetensors: 33%|███▎ | 377M/1.15G [00:07<00:12, 62.3MB/s]\u001b[A\n",
392
- "model-00001-of-00003.safetensors: 8%|▊ | 419M/4.98G [00:07<01:27, 52.4MB/s]\u001b[A\n",
393
- "\n",
394
- "model-00003-of-00003.safetensors: 34%|███▎ | 388M/1.15G [00:07<00:15, 50.9MB/s]\u001b[A\u001b[A\n",
395
- "model-00001-of-00003.safetensors: 9%|▉ | 440M/4.98G [00:07<01:12, 62.9MB/s]\u001b[A\n",
396
- "\n",
397
- "model-00003-of-00003.safetensors: 35%|███▌ | 409M/1.15G [00:08<00:12, 57.7MB/s]\u001b[A\u001b[A\n",
398
- "model-00003-of-00003.safetensors: 36%|███▋ | 419M/1.15G [00:08<00:12, 59.2MB/s]\u001b[A\n",
399
- "\n",
400
- "model-00002-of-00003.safetensors: 11%|█ | 535M/4.98G [00:08<01:21, 54.9MB/s]\u001b[A\u001b[A\n",
401
- "model-00003-of-00003.safetensors: 38%|███▊ | 440M/1.15G [00:08<00:11, 64.5MB/s]\u001b[A\n",
402
- "model-00001-of-00003.safetensors: 10%|▉ | 482M/4.98G [00:08<01:16, 59.0MB/s]\u001b[A\n",
403
- "\n",
404
- "model-00002-of-00003.safetensors: 11%|█ | 545M/4.98G [00:08<01:39, 44.6MB/s]\u001b[A\u001b[A\n",
405
- "model-00003-of-00003.safetensors: 39%|███▉ | 451M/1.15G [00:09<00:14, 49.7MB/s]\u001b[A\n",
406
- "\n",
407
- "model-00003-of-00003.safetensors: 40%|███▉ | 461M/1.15G [00:09<00:12, 53.8MB/s]\u001b[A\u001b[A\n",
408
- "model-00003-of-00003.safetensors: 41%|████ | 472M/1.15G [00:09<00:12, 56.4MB/s]\u001b[A\n",
409
- "\n",
410
- "model-00003-of-00003.safetensors: 42%|████▏ | 482M/1.15G [00:09<00:11, 56.5MB/s]\u001b[A\u001b[A\n",
411
- "\n",
412
- "model-00002-of-00003.safetensors: 12%|█▏ | 598M/4.98G [00:09<01:24, 52.2MB/s]\u001b[A\u001b[A\n",
413
- "model-00003-of-00003.safetensors: 44%|████▎ | 503M/1.15G [00:09<00:09, 69.6MB/s]\u001b[A\n",
414
- "\n",
415
- "model-00002-of-00003.safetensors: 12%|█▏ | 608M/4.98G [00:09<01:24, 51.6MB/s]\u001b[A\u001b[A\n",
416
- "model-00003-of-00003.safetensors: 45%|████▍ | 514M/1.15G [00:09<00:10, 59.1MB/s]\u001b[A\n",
417
- "\n",
418
- "model-00002-of-00003.safetensors: 12%|█▏ | 619M/4.98G [00:10<01:23, 52.1MB/s]\u001b[A\u001b[A\n",
419
- "model-00003-of-00003.safetensors: 46%|████▋ | 535M/1.15G [00:10<00:08, 71.5MB/s]\u001b[A\n",
420
- "\n",
421
- "model-00002-of-00003.safetensors: 13%|█▎ | 629M/4.98G [00:10<01:18, 55.5MB/s]\u001b[A\u001b[A\n",
422
- "\n",
423
- "model-00003-of-00003.safetensors: 47%|████▋ | 545M/1.15G [00:10<00:09, 67.2MB/s]\u001b[A\u001b[A\n",
424
- "model-00001-of-00003.safetensors: 11%|█▏ | 566M/4.98G [00:10<01:26, 51.3MB/s]\u001b[A\n",
425
- "\n",
426
- "model-00002-of-00003.safetensors: 13%|█▎ | 650M/4.98G [00:10<01:06, 65.6MB/s]\u001b[A\u001b[A\n",
427
- "\n",
428
- "model-00002-of-00003.safetensors: 13%|█▎ | 661M/4.98G [00:10<00:59, 72.8MB/s]\u001b[A\u001b[A\n",
429
- "\n",
430
- "model-00002-of-00003.safetensors: 14%|█▎ | 682M/4.98G [00:10<00:53, 81.0MB/s]\u001b[A\u001b[A\n",
431
- "model-00003-of-00003.safetensors: 49%|████▉ | 566M/1.15G [00:11<00:12, 46.4MB/s]\u001b[A\n",
432
- "\n",
433
- "model-00002-of-00003.safetensors: 14%|█▍ | 692M/4.98G [00:11<01:10, 60.8MB/s]\u001b[A\u001b[A\n",
434
- "model-00003-of-00003.safetensors: 52%|█████▏ | 598M/1.15G [00:11<00:09, 58.9MB/s]\u001b[A\n",
435
- "model-00003-of-00003.safetensors: 53%|█████▎ | 608M/1.15G [00:11<00:09, 56.4MB/s]\u001b[A\n",
436
- "\n",
437
- "model-00002-of-00003.safetensors: 14%|█▍ | 703M/4.98G [00:11<01:57, 36.5MB/s]\u001b[A\u001b[A\n",
438
- "model-00001-of-00003.safetensors: 13%|█▎ | 629M/4.98G [00:11<01:22, 52.9MB/s]\u001b[A\n",
439
- "\n",
440
- "model-00002-of-00003.safetensors: 15%|█▍ | 744M/4.98G [00:11<00:59, 70.6MB/s]\u001b[A\u001b[A\n",
441
- "model-00003-of-00003.safetensors: 55%|█████▍ | 629M/1.15G [00:12<00:08, 59.7MB/s]\u001b[A\n",
442
- "model-00001-of-00003.safetensors: 13%|█▎ | 650M/4.98G [00:12<01:11, 60.4MB/s]\u001b[A\n",
443
- "\n",
444
- "model-00003-of-00003.safetensors: 55%|█████▌ | 640M/1.15G [00:12<00:08, 62.1MB/s]\u001b[A\u001b[A\n",
445
- "\n",
446
- "model-00003-of-00003.safetensors: 56%|█████▋ | 650M/1.15G [00:12<00:08, 61.3MB/s]\u001b[A\u001b[A\n",
447
- "model-00001-of-00003.safetensors: 13%|█▎ | 661M/4.98G [00:12<01:19, 54.3MB/s]\u001b[A\n",
448
- "\n",
449
- "model-00002-of-00003.safetensors: 16%|█▌ | 776M/4.98G [00:12<01:09, 60.9MB/s]\u001b[A\u001b[A\n",
450
- "model-00003-of-00003.safetensors: 57%|█████▋ | 661M/1.15G [00:13<00:18, 26.1MB/s]\u001b[A\n",
451
- "model-00001-of-00003.safetensors: 14%|█▍ | 692M/4.98G [00:13<02:04, 34.4MB/s]\u001b[A\n",
452
- "\n",
453
- "model-00003-of-00003.safetensors: 58%|█████▊ | 671M/1.15G [00:14<00:26, 18.4MB/s]\u001b[A\u001b[A\n",
454
- "\n",
455
- "model-00002-of-00003.safetensors: 16%|█▌ | 797M/4.98G [00:14<03:36, 19.4MB/s]\u001b[A\u001b[A\n",
456
- "model-00003-of-00003.safetensors: 61%|██████ | 703M/1.15G [00:14<00:12, 36.5MB/s]\u001b[A\n",
457
- "model-00001-of-00003.safetensors: 15%|█▌ | 755M/4.98G [00:14<01:21, 52.1MB/s]\u001b[A\n",
458
- "\n",
459
- "model-00003-of-00003.safetensors: 65%|██████▌ | 755M/1.15G [00:14<00:05, 74.6MB/s]\u001b[A\u001b[A\n",
460
- "\n",
461
- "model-00002-of-00003.safetensors: 18%|█▊ | 881M/4.98G [00:14<00:55, 74.5MB/s]\u001b[A\u001b[A\n",
462
- "model-00003-of-00003.safetensors: 68%|██████▊ | 786M/1.15G [00:14<00:04, 87.3MB/s]\u001b[A\n",
463
- "\n",
464
- "model-00003-of-00003.safetensors: 70%|██████▉ | 807M/1.15G [00:15<00:03, 92.4MB/s]\u001b[A\u001b[A\n",
465
- "\n",
466
- "model-00002-of-00003.safetensors: 19%|█▊ | 923M/4.98G [00:15<00:53, 76.6MB/s]\u001b[A\u001b[A\n",
467
- "model-00001-of-00003.safetensors: 16%|█▌ | 797M/4.98G [00:15<01:22, 50.6MB/s]\u001b[A\n",
468
- "model-00001-of-00003.safetensors: 16%|█▋ | 818M/4.98G [00:15<01:26, 48.1MB/s]\u001b[A\n",
469
- "model-00003-of-00003.safetensors: 72%|███████▏ | 828M/1.15G [00:16<00:07, 42.6MB/s]\u001b[A\n",
470
- "\n",
471
- "model-00003-of-00003.safetensors: 75%|███████▌ | 870M/1.15G [00:16<00:04, 67.9MB/s]\u001b[A\u001b[A\n",
472
- "model-00003-of-00003.safetensors: 78%|███████▊ | 902M/1.15G [00:17<00:05, 43.1MB/s]\u001b[A\n",
473
- "\n",
474
- "model-00002-of-00003.safetensors: 20%|█▉ | 975M/4.98G [00:17<02:05, 32.0MB/s]\u001b[A\u001b[A\n",
475
- "model-00001-of-00003.safetensors: 17%|█▋ | 849M/4.98G [00:17<03:05, 22.3MB/s]\u001b[A\n",
476
- "\n",
477
- "model-00003-of-00003.safetensors: 81%|████████ | 933M/1.15G [00:19<00:06, 36.5MB/s]]\u001b[A\u001b[A\n",
478
- "model-00001-of-00003.safetensors: 17%|█▋ | 870M/4.98G [00:19<03:20, 20.5MB/s]\u001b[A\n",
479
- "\n",
480
- "model-00003-of-00003.safetensors: 85%|████████▍ | 975M/1.15G [00:19<00:03, 54.8MB/s]]\u001b[A\u001b[A\n",
481
- "model-00001-of-00003.safetensors: 18%|█▊ | 912M/4.98G [00:19<01:40, 40.6MB/s]\u001b[A\n",
482
- "\n",
483
- "model-00002-of-00003.safetensors: 22%|██▏ | 1.08G/4.98G [00:19<01:04, 60.2MB/s]\u001b[A\u001b[A\n",
484
- "\n",
485
- "model-00002-of-00003.safetensors: 22%|██▏ | 1.11G/4.98G [00:19<00:50, 77.2MB/s]\u001b[A\u001b[A\n",
486
- "model-00003-of-00003.safetensors: 93%|█████████▎| 1.07G/1.15G [00:20<00:01, 73.8MB/s][A\n",
487
- "model-00003-of-00003.safetensors: 95%|█████████▍| 1.09G/1.15G [00:20<00:00, 72.8MB/s][A\n",
488
- "\n",
489
- "model-00002-of-00003.safetensors: 23%|██▎ | 1.14G/4.98G [00:20<01:20, 47.4MB/s]\u001b[A\u001b[A\n",
490
- "model-00003-of-00003.safetensors: 96%|█████████▋| 1.11G/1.15G [00:20<00:00, 69.0MB/s][A\n",
491
- "\n",
492
- "model-00002-of-00003.safetensors: 24%|██▍ | 1.18G/4.98G [00:20<00:55, 68.9MB/s]\u001b[A\u001b[A\n",
493
- "model-00001-of-00003.safetensors: 20%|█▉ | 996M/4.98G [00:20<01:19, 50.1MB/s]\u001b[A\n",
494
- "\n",
495
- "model-00003-of-00003.safetensors: 97%|█████████▋| 1.12G/1.15G [00:20<00:00, 68.7MB/s]\u001b[A\u001b[A\n",
496
- "model-00001-of-00003.safetensors: 20%|██ | 1.02G/4.98G [00:20<01:10, 56.5MB/s]\u001b[A\n",
497
- "\n",
498
- "model-00002-of-00003.safetensors: 25%|██▌ | 1.25G/4.98G [00:21<00:42, 88.8MB/s]\u001b[A\u001b[A\n",
499
- "model-00003-of-00003.safetensors: 99%|█████████▉| 1.14G/1.15G [00:21<00:00, 53.6MB/s]\u001b[A\n",
500
- "\n",
501
- "model-00003-of-00003.safetensors: 100%|██████████| 1.15G/1.15G [00:21<00:00, 53.4MB/s]\u001b[A\u001b[A\n",
502
- "\n",
503
- "model-00001-of-00003.safetensors: 21%|██ | 1.05G/4.98G [00:21<01:14, 52.8MB/s]\u001b[A\n",
504
- "model-00001-of-00003.safetensors: 21%|██▏ | 1.06G/4.98G [00:21<01:23, 46.8MB/s]\u001b[A\n",
505
- "\n",
506
- "model-00002-of-00003.safetensors: 26%|██▌ | 1.29G/4.98G [00:22<01:06, 55.4MB/s]\u001b[A\u001b[A\n",
507
- "model-00001-of-00003.safetensors: 22%|██▏ | 1.08G/4.98G [00:22<01:18, 49.6MB/s]\u001b[A\n",
508
- "model-00001-of-00003.safetensors: 22%|██▏ | 1.09G/4.98G [00:22<01:15, 51.6MB/s]\u001b[A\n",
509
- "\n",
510
- "model-00002-of-00003.safetensors: 26%|██▋ | 1.31G/4.98G [00:22<01:05, 56.0MB/s]\u001b[A\u001b[A\n",
511
- "model-00001-of-00003.safetensors: 22%|██▏ | 1.11G/4.98G [00:22<01:13, 52.7MB/s]\u001b[A\n",
512
- "model-00001-of-00003.safetensors: 23%|██▎ | 1.12G/4.98G [00:23<01:25, 45.0MB/s]\u001b[A\n",
513
- "\n",
514
- "model-00002-of-00003.safetensors: 27%|██▋ | 1.32G/4.98G [00:23<01:31, 40.0MB/s]\u001b[A\u001b[A\n",
515
- "model-00001-of-00003.safetensors: 23%|██▎ | 1.14G/4.98G [00:23<01:15, 50.8MB/s]\u001b[A\n",
516
- "\n",
517
- "model-00002-of-00003.safetensors: 27%|██▋ | 1.33G/4.98G [00:23<01:33, 39.1MB/s]\u001b[A\u001b[A\n",
518
- "\n",
519
- "model-00002-of-00003.safetensors: 27%|██▋ | 1.34G/4.98G [00:23<01:31, 39.9MB/s]\u001b[A\u001b[A\n",
520
- "model-00001-of-00003.safetensors: 23%|██▎ | 1.15G/4.98G [00:23<01:24, 45.5MB/s]\u001b[A\n",
521
- "\n",
522
- "model-00002-of-00003.safetensors: 27%|██▋ | 1.36G/4.98G [00:24<01:14, 48.4MB/s]\u001b[A\u001b[A\n",
523
- "model-00001-of-00003.safetensors: 24%|██▎ | 1.17G/4.98G [00:24<01:18, 48.7MB/s]\u001b[A\n",
524
- "model-00001-of-00003.safetensors: 24%|██▍ | 1.18G/4.98G [00:24<01:24, 45.1MB/s]\u001b[A\n",
525
- "\n",
526
- "model-00002-of-00003.safetensors: 28%|██▊ | 1.38G/4.98G [00:24<01:20, 44.7MB/s]\u001b[A\u001b[A\n",
527
- "model-00001-of-00003.safetensors: 24%|██▍ | 1.21G/4.98G [00:24<01:12, 52.1MB/s]\u001b[A\n",
528
- "\n",
529
- "model-00002-of-00003.safetensors: 28%|██▊ | 1.39G/4.98G [00:24<01:19, 45.0MB/s]\u001b[A\u001b[A\n",
530
- "model-00001-of-00003.safetensors: 24%|██▍ | 1.22G/4.98G [00:25<01:30, 41.8MB/s]\u001b[A\n",
531
- "model-00001-of-00003.safetensors: 25%|██▍ | 1.24G/4.98G [00:25<01:11, 52.1MB/s]\u001b[A\n",
532
- "model-00001-of-00003.safetensors: 25%|██▌ | 1.25G/4.98G [00:25<01:08, 54.3MB/s]\u001b[A\n",
533
- "model-00001-of-00003.safetensors: 25%|██▌ | 1.26G/4.98G [00:25<01:03, 58.3MB/s]\u001b[A\n",
534
- "\n",
535
- "model-00002-of-00003.safetensors: 28%|██▊ | 1.41G/4.98G [00:25<02:25, 24.7MB/s]\u001b[A\u001b[A\n",
536
- "model-00001-of-00003.safetensors: 25%|██▌ | 1.27G/4.98G [00:26<01:04, 57.8MB/s]\u001b[A\n",
537
- "\n",
538
- "model-00002-of-00003.safetensors: 29%|██▉ | 1.45G/4.98G [00:26<01:09, 51.1MB/s]\u001b[A\u001b[A\n",
539
- "model-00001-of-00003.safetensors: 26%|██▌ | 1.28G/4.98G [00:26<00:57, 64.4MB/s]\u001b[A\n",
540
- "model-00001-of-00003.safetensors: 26%|██▌ | 1.29G/4.98G [00:26<01:03, 58.3MB/s]\u001b[A\n",
541
- "model-00001-of-00003.safetensors: 26%|██▌ | 1.30G/4.98G [00:26<01:09, 53.1MB/s]\u001b[A\n",
542
- "\n",
543
- "model-00002-of-00003.safetensors: 30%|██▉ | 1.49G/4.98G [00:26<00:57, 61.2MB/s]\u001b[A\u001b[A\n",
544
- "model-00001-of-00003.safetensors: 26%|██▋ | 1.31G/4.98G [00:26<01:00, 60.9MB/s]\u001b[A\n",
545
- "model-00001-of-00003.safetensors: 27%|██▋ | 1.32G/4.98G [00:26<01:09, 53.0MB/s]\u001b[A\n",
546
- "\n",
547
- "model-00002-of-00003.safetensors: 30%|███ | 1.51G/4.98G [00:27<01:03, 54.6MB/s]\u001b[A\u001b[A\n",
548
- "model-00001-of-00003.safetensors: 27%|██▋ | 1.33G/4.98G [00:27<01:07, 54.1MB/s]\u001b[A\n",
549
- "\n",
550
- "model-00002-of-00003.safetensors: 31%|███ | 1.52G/4.98G [00:27<01:07, 51.3MB/s]\u001b[A\u001b[A\n",
551
- "model-00001-of-00003.safetensors: 27%|██▋ | 1.35G/4.98G [00:27<01:02, 58.3MB/s]\u001b[A\n",
552
- "model-00001-of-00003.safetensors: 27%|██▋ | 1.36G/4.98G [00:27<01:08, 52.6MB/s]\u001b[A\n",
553
- "model-00001-of-00003.safetensors: 28%|██▊ | 1.37G/4.98G [00:27<01:10, 51.2MB/s]\u001b[A\n",
554
- "\n",
555
- "model-00002-of-00003.safetensors: 31%|███ | 1.54G/4.98G [00:27<01:15, 45.7MB/s]\u001b[A\u001b[A\n",
556
- "model-00001-of-00003.safetensors: 28%|██▊ | 1.38G/4.98G [00:28<01:03, 56.4MB/s]\u001b[A\n",
557
- "\n",
558
- "model-00002-of-00003.safetensors: 31%|███ | 1.55G/4.98G [00:28<01:11, 47.7MB/s]\u001b[A\u001b[A\n",
559
- "\n",
560
- "model-00002-of-00003.safetensors: 31%|███▏ | 1.56G/4.98G [00:28<01:05, 52.1MB/s]\u001b[A\u001b[A\n",
561
- "model-00001-of-00003.safetensors: 28%|██▊ | 1.39G/4.98G [00:28<01:12, 49.6MB/s]\u001b[A\n",
562
- "model-00001-of-00003.safetensors: 28%|██▊ | 1.41G/4.98G [00:28<01:03, 56.5MB/s]\u001b[A\n",
563
- "\n",
564
- "model-00002-of-00003.safetensors: 32%|███▏ | 1.57G/4.98G [00:28<01:09, 49.2MB/s]\u001b[A\u001b[A\n",
565
- "\n",
566
- "model-00002-of-00003.safetensors: 32%|███▏ | 1.59G/4.98G [00:28<00:51, 66.4MB/s]\u001b[A\u001b[A\n",
567
- "model-00001-of-00003.safetensors: 28%|██▊ | 1.42G/4.98G [00:28<01:17, 46.3MB/s]\u001b[A\n",
568
- "\n",
569
- "model-00002-of-00003.safetensors: 32%|███▏ | 1.60G/4.98G [00:28<00:51, 66.0MB/s]\u001b[A\u001b[A\n",
570
- "model-00001-of-00003.safetensors: 29%|██▊ | 1.43G/4.98G [00:29<01:23, 42.8MB/s]\u001b[A\n",
571
- "\n",
572
- "model-00002-of-00003.safetensors: 33%|███▎ | 1.63G/4.98G [00:29<00:54, 61.8MB/s]\u001b[A\u001b[A\n",
573
- "model-00001-of-00003.safetensors: 29%|██▉ | 1.44G/4.98G [00:29<01:12, 49.1MB/s]\u001b[A\n",
574
- "\n",
575
- "model-00002-of-00003.safetensors: 33%|███▎ | 1.64G/4.98G [00:29<00:51, 64.7MB/s]\u001b[A\u001b[A\n",
576
- "model-00001-of-00003.safetensors: 29%|██▉ | 1.45G/4.98G [00:29<01:12, 48.8MB/s]\u001b[A\n",
577
- "model-00001-of-00003.safetensors: 29%|██▉ | 1.46G/4.98G [00:29<01:06, 52.7MB/s]\u001b[A\n",
578
- "\n",
579
- "model-00002-of-00003.safetensors: 33%|███▎ | 1.66G/4.98G [00:29<00:51, 65.0MB/s]\u001b[A\u001b[A\n",
580
- "model-00001-of-00003.safetensors: 30%|██▉ | 1.48G/4.98G [00:30<01:10, 49.4MB/s]\u001b[A\n",
581
- "model-00001-of-00003.safetensors: 30%|██▉ | 1.49G/4.98G [00:30<01:04, 54.3MB/s]\u001b[A\n",
582
- "model-00001-of-00003.safetensors: 30%|███ | 1.51G/4.98G [00:30<00:55, 62.2MB/s]\u001b[A\n",
583
- "model-00001-of-00003.safetensors: 31%|███ | 1.52G/4.98G [00:30<00:57, 60.4MB/s]\u001b[A\n",
584
- "model-00001-of-00003.safetensors: 31%|███ | 1.54G/4.98G [00:30<00:47, 72.7MB/s]\u001b[A\n",
585
- "model-00001-of-00003.safetensors: 31%|███ | 1.55G/4.98G [00:31<00:54, 63.5MB/s]\u001b[A\n",
586
- "\n",
587
- "model-00002-of-00003.safetensors: 33%|███▎ | 1.67G/4.98G [00:31<02:21, 23.5MB/s]\u001b[A\u001b[A\n",
588
- "\n",
589
- "model-00002-of-00003.safetensors: 34%|███▍ | 1.71G/4.98G [00:31<01:07, 48.4MB/s]\u001b[A\u001b[A\n",
590
- "model-00001-of-00003.safetensors: 31%|███▏ | 1.56G/4.98G [00:31<00:56, 60.2MB/s]\u001b[A\n",
591
- "\n",
592
- "model-00002-of-00003.safetensors: 35%|███▌ | 1.75G/4.98G [00:31<00:46, 69.8MB/s]\u001b[A\u001b[A\n",
593
- "model-00001-of-00003.safetensors: 32%|███▏ | 1.57G/4.98G [00:31<01:05, 52.0MB/s]\u001b[A\n",
594
- "\n",
595
- "model-00002-of-00003.safetensors: 36%|███▌ | 1.77G/4.98G [00:31<00:45, 70.0MB/s]\u001b[A\u001b[A\n",
596
- "model-00001-of-00003.safetensors: 32%|███▏ | 1.59G/4.98G [00:31<00:59, 56.5MB/s]\u001b[A\n",
597
- "model-00001-of-00003.safetensors: 32%|███▏ | 1.60G/4.98G [00:32<01:13, 46.1MB/s]\u001b[A\n",
598
- "\n",
599
- "model-00002-of-00003.safetensors: 36%|███▌ | 1.79G/4.98G [00:32<00:55, 57.0MB/s]\u001b[A\u001b[A\n",
600
- "\n",
601
- "model-00002-of-00003.safetensors: 36%|███▋ | 1.81G/4.98G [00:32<00:49, 63.8MB/s]\u001b[A\u001b[A\n",
602
- "model-00001-of-00003.safetensors: 33%|███▎ | 1.63G/4.98G [00:32<01:06, 50.4MB/s]\u001b[A\n",
603
- "model-00001-of-00003.safetensors: 33%|███▎ | 1.64G/4.98G [00:32<01:02, 53.3MB/s]\u001b[A\n",
604
- "\n",
605
- "model-00002-of-00003.safetensors: 37%|███▋ | 1.82G/4.98G [00:32<00:56, 55.7MB/s]\u001b[A\u001b[A\n",
606
- "model-00001-of-00003.safetensors: 33%|███▎ | 1.66G/4.98G [00:33<00:54, 61.0MB/s]\u001b[A\n",
607
- "\n",
608
- "model-00002-of-00003.safetensors: 37%|███▋ | 1.85G/4.98G [00:33<00:52, 59.9MB/s]\u001b[A\u001b[A\n",
609
- "model-00001-of-00003.safetensors: 33%|███▎ | 1.67G/4.98G [00:33<01:04, 51.3MB/s]\u001b[A\n",
610
- "\n",
611
- "model-00002-of-00003.safetensors: 37%|███▋ | 1.86G/4.98G [00:33<00:50, 61.7MB/s]\u001b[A\u001b[A\n",
612
- "\n",
613
- "model-00002-of-00003.safetensors: 37%|███▋ | 1.87G/4.98G [00:33<00:46, 67.0MB/s]\u001b[A\u001b[A\n",
614
- "model-00001-of-00003.safetensors: 34%|███▍ | 1.69G/4.98G [00:33<00:55, 59.5MB/s]\u001b[A\n",
615
- "\n",
616
- "model-00002-of-00003.safetensors: 38%|███▊ | 1.88G/4.98G [00:33<00:48, 64.3MB/s]\u001b[A\u001b[A\n",
617
- "model-00001-of-00003.safetensors: 34%|███▍ | 1.70G/4.98G [00:33<00:52, 62.7MB/s]\u001b[A\n",
618
- "model-00001-of-00003.safetensors: 35%|███▍ | 1.72G/4.98G [00:33<00:42, 76.9MB/s]\u001b[A\n",
619
- "model-00001-of-00003.safetensors: 35%|███▍ | 1.73G/4.98G [00:34<00:47, 68.8MB/s]\u001b[A\n",
620
- "\n",
621
- "model-00002-of-00003.safetensors: 38%|███▊ | 1.90G/4.98G [00:34<00:57, 53.8MB/s]\u001b[A\u001b[A\n",
622
- "\n",
623
- "model-00002-of-00003.safetensors: 38%|███▊ | 1.91G/4.98G [00:34<01:02, 48.9MB/s]\u001b[A\u001b[A\n",
624
- "model-00001-of-00003.safetensors: 35%|███▌ | 1.75G/4.98G [00:34<00:48, 66.3MB/s]\u001b[A\n",
625
- "model-00001-of-00003.safetensors: 35%|███▌ | 1.76G/4.98G [00:34<00:45, 70.0MB/s]\u001b[A\n",
626
- "\n",
627
- "model-00002-of-00003.safetensors: 39%|███▊ | 1.93G/4.98G [00:34<00:58, 52.1MB/s]\u001b[A\u001b[A\n",
628
- "model-00001-of-00003.safetensors: 36%|███▌ | 1.78G/4.98G [00:34<00:46, 68.6MB/s]\u001b[A\n",
629
- "\n",
630
- "model-00002-of-00003.safetensors: 39%|███▉ | 1.94G/4.98G [00:34<00:59, 50.8MB/s]\u001b[A\u001b[A\n",
631
- "\n",
632
- "model-00002-of-00003.safetensors: 39%|███▉ | 1.96G/4.98G [00:35<00:47, 64.2MB/s]\u001b[A\u001b[A\n",
633
- "model-00001-of-00003.safetensors: 36%|███▌ | 1.79G/4.98G [00:35<00:57, 55.1MB/s]\u001b[A\n",
634
- "\n",
635
- "model-00002-of-00003.safetensors: 40%|███▉ | 1.97G/4.98G [00:35<00:46, 64.4MB/s]\u001b[A\u001b[A\n",
636
- "model-00001-of-00003.safetensors: 36%|███▋ | 1.81G/4.98G [00:35<00:43, 72.5MB/s]\u001b[A\n",
637
- "\n",
638
- "model-00002-of-00003.safetensors: 40%|███▉ | 1.98G/4.98G [00:35<00:46, 63.9MB/s]\u001b[A\u001b[A\n",
639
- "model-00001-of-00003.safetensors: 37%|███▋ | 1.82G/4.98G [00:35<00:46, 68.3MB/s]\u001b[A\n",
640
- "\n",
641
- "model-00002-of-00003.safetensors: 40%|███▉ | 1.99G/4.98G [00:35<00:44, 67.5MB/s]\u001b[A\u001b[A\n",
642
- "model-00001-of-00003.safetensors: 37%|███▋ | 1.84G/4.98G [00:35<00:48, 65.1MB/s]\u001b[A\n",
643
- "\n",
644
- "model-00002-of-00003.safetensors: 40%|████ | 2.00G/4.98G [00:36<01:00, 49.1MB/s]\u001b[A\u001b[A\n",
645
- "model-00001-of-00003.safetensors: 37%|███▋ | 1.85G/4.98G [00:36<01:02, 50.0MB/s]\u001b[A\n",
646
- "\n",
647
- "model-00002-of-00003.safetensors: 41%|████ | 2.02G/4.98G [00:36<00:43, 67.7MB/s]\u001b[A\u001b[A\n",
648
- "model-00001-of-00003.safetensors: 37%|███▋ | 1.86G/4.98G [00:36<00:55, 56.1MB/s]\u001b[A\n",
649
- "model-00001-of-00003.safetensors: 37%|███▋ | 1.87G/4.98G [00:36<00:53, 57.9MB/s]\u001b[A\n",
650
- "\n",
651
- "model-00002-of-00003.safetensors: 41%|████ | 2.03G/4.98G [00:36<00:53, 54.6MB/s]\u001b[A\u001b[A\n",
652
- "\n",
653
- "model-00002-of-00003.safetensors: 41%|████ | 2.06G/4.98G [00:36<00:42, 69.0MB/s]\u001b[A\u001b[A\n",
654
- "model-00001-of-00003.safetensors: 38%|███▊ | 1.88G/4.98G [00:37<01:29, 34.9MB/s]\u001b[A\n",
655
- "\n",
656
- "model-00002-of-00003.safetensors: 41%|████▏ | 2.07G/4.98G [00:37<00:54, 53.3MB/s]\u001b[A\u001b[A\n",
657
- "model-00001-of-00003.safetensors: 38%|███▊ | 1.89G/4.98G [00:37<01:12, 42.8MB/s]\u001b[A\n",
658
- "\n",
659
- "model-00002-of-00003.safetensors: 42%|████▏ | 2.09G/4.98G [00:37<00:47, 61.4MB/s]\u001b[A\u001b[A\n",
660
- "\n",
661
- "model-00002-of-00003.safetensors: 42%|████▏ | 2.10G/4.98G [00:37<00:50, 57.1MB/s]\u001b[A\u001b[A\n",
662
- "model-00001-of-00003.safetensors: 38%|███▊ | 1.90G/4.98G [00:37<01:29, 34.4MB/s]\u001b[A\n",
663
- "model-00001-of-00003.safetensors: 38%|███▊ | 1.91G/4.98G [00:37<01:18, 39.3MB/s]\u001b[A\n",
664
- "\n",
665
- "model-00002-of-00003.safetensors: 43%|████▎ | 2.12G/4.98G [00:37<00:47, 60.8MB/s]\u001b[A\u001b[A\n",
666
- "\n",
667
- "model-00002-of-00003.safetensors: 43%|████▎ | 2.13G/4.98G [00:37<00:46, 62.0MB/s]\u001b[A\u001b[A\n",
668
- "model-00001-of-00003.safetensors: 39%|███▊ | 1.93G/4.98G [00:38<01:02, 49.2MB/s]\u001b[A\n",
669
- "\n",
670
- "model-00002-of-00003.safetensors: 43%|████▎ | 2.15G/4.98G [00:38<00:45, 61.9MB/s]\u001b[A\u001b[A\n",
671
- "model-00001-of-00003.safetensors: 39%|███▉ | 1.94G/4.98G [00:38<01:08, 44.3MB/s]\u001b[A\n",
672
- "\n",
673
- "model-00002-of-00003.safetensors: 44%|████▎ | 2.17G/4.98G [00:38<00:35, 79.7MB/s]\u001b[A\u001b[A\n",
674
- "model-00001-of-00003.safetensors: 39%|███▉ | 1.96G/4.98G [00:38<00:54, 55.6MB/s]\u001b[A\n",
675
- "model-00001-of-00003.safetensors: 40%|███▉ | 1.97G/4.98G [00:38<00:54, 55.6MB/s]\u001b[A\n",
676
- "\n",
677
- "model-00002-of-00003.safetensors: 44%|████▍ | 2.18G/4.98G [00:39<01:04, 43.3MB/s]\u001b[A\u001b[A\n",
678
- "model-00001-of-00003.safetensors: 40%|███▉ | 1.99G/4.98G [00:39<00:56, 53.4MB/s]\u001b[A\n",
679
- "\n",
680
- "model-00002-of-00003.safetensors: 45%|████▍ | 2.22G/4.98G [00:39<00:33, 81.5MB/s]\u001b[A\u001b[A\n",
681
- "model-00001-of-00003.safetensors: 40%|████ | 2.00G/4.98G [00:39<00:58, 50.9MB/s]\u001b[A\n",
682
- "model-00001-of-00003.safetensors: 41%|████ | 2.02G/4.98G [00:39<00:52, 56.5MB/s]\u001b[A\n",
683
- "\n",
684
- "model-00002-of-00003.safetensors: 45%|████▌ | 2.24G/4.98G [00:39<00:43, 62.6MB/s]\u001b[A\u001b[A\n",
685
- "\n",
686
- "model-00002-of-00003.safetensors: 45%|████▌ | 2.26G/4.98G [00:40<00:40, 66.4MB/s]\u001b[A\u001b[A\n",
687
- "model-00001-of-00003.safetensors: 41%|████ | 2.03G/4.98G [00:40<01:08, 42.9MB/s]\u001b[A\n",
688
- "\n",
689
- "model-00002-of-00003.safetensors: 46%|████▌ | 2.29G/4.98G [00:40<00:43, 61.9MB/s]\u001b[A\u001b[A\n",
690
- "model-00001-of-00003.safetensors: 41%|████ | 2.04G/4.98G [00:40<01:20, 36.3MB/s]\u001b[A\n",
691
- "\n",
692
- "model-00002-of-00003.safetensors: 46%|████▋ | 2.31G/4.98G [00:40<00:38, 69.2MB/s]\u001b[A\u001b[A\n",
693
- "\n",
694
- "model-00002-of-00003.safetensors: 47%|████▋ | 2.33G/4.98G [00:40<00:32, 82.5MB/s]\u001b[A\u001b[A\n",
695
- "model-00001-of-00003.safetensors: 41%|████ | 2.06G/4.98G [00:41<01:24, 34.6MB/s]\u001b[A\n",
696
- "\n",
697
- "model-00002-of-00003.safetensors: 47%|████▋ | 2.35G/4.98G [00:41<00:30, 87.6MB/s]\u001b[A\u001b[A\n",
698
- "model-00001-of-00003.safetensors: 41%|████▏ | 2.07G/4.98G [00:41<01:14, 39.2MB/s]\u001b[A\n",
699
- "\n",
700
- "model-00002-of-00003.safetensors: 48%|████▊ | 2.37G/4.98G [00:41<00:34, 75.4MB/s]\u001b[A\u001b[A\n",
701
- "model-00001-of-00003.safetensors: 42%|████▏ | 2.09G/4.98G [00:41<00:59, 48.6MB/s]\u001b[A\n",
702
- "\n",
703
- "model-00002-of-00003.safetensors: 48%|████▊ | 2.38G/4.98G [00:42<01:16, 34.0MB/s]\u001b[A\u001b[A\n",
704
- "model-00001-of-00003.safetensors: 42%|████▏ | 2.10G/4.98G [00:42<01:54, 25.2MB/s]\u001b[A\n",
705
- "\n",
706
- "model-00002-of-00003.safetensors: 49%|████▊ | 2.42G/4.98G [00:42<00:40, 62.6MB/s]\u001b[A\u001b[A\n",
707
- "model-00001-of-00003.safetensors: 43%|████▎ | 2.15G/4.98G [00:42<00:46, 61.5MB/s]\u001b[A\n",
708
- "model-00001-of-00003.safetensors: 44%|████▎ | 2.17G/4.98G [00:42<00:37, 74.7MB/s]\u001b[A\n",
709
- "\n",
710
- "model-00002-of-00003.safetensors: 49%|████▉ | 2.44G/4.98G [00:42<00:39, 64.0MB/s]\u001b[A\u001b[A\n",
711
- "model-00001-of-00003.safetensors: 44%|████▍ | 2.19G/4.98G [00:42<00:33, 82.8MB/s]\u001b[A\n",
712
- "\n",
713
- "model-00002-of-00003.safetensors: 49%|████▉ | 2.46G/4.98G [00:43<00:39, 63.6MB/s]\u001b[A\u001b[A\n",
714
- "\n",
715
- "model-00002-of-00003.safetensors: 50%|████▉ | 2.49G/4.98G [00:43<00:33, 74.4MB/s]\u001b[A\u001b[A\n",
716
- "model-00001-of-00003.safetensors: 44%|████▍ | 2.21G/4.98G [00:43<00:45, 60.8MB/s]\u001b[A\n",
717
- "\n",
718
- "model-00002-of-00003.safetensors: 50%|█████ | 2.51G/4.98G [00:43<00:32, 76.9MB/s]\u001b[A\u001b[A\n",
719
- "model-00001-of-00003.safetensors: 45%|████▍ | 2.23G/4.98G [00:43<00:46, 58.6MB/s]\u001b[A\n",
720
- "model-00001-of-00003.safetensors: 45%|████▌ | 2.24G/4.98G [00:44<00:52, 51.8MB/s]\u001b[A\n",
721
- "\n",
722
- "model-00002-of-00003.safetensors: 51%|█████ | 2.53G/4.98G [00:44<00:43, 56.8MB/s]\u001b[A\u001b[A\n",
723
- "model-00001-of-00003.safetensors: 45%|████▌ | 2.26G/4.98G [00:44<00:45, 59.5MB/s]\u001b[A\n",
724
- "\n",
725
- "model-00002-of-00003.safetensors: 51%|█████ | 2.54G/4.98G [00:44<00:48, 50.3MB/s]\u001b[A\u001b[A\n",
726
- "model-00001-of-00003.safetensors: 46%|████▌ | 2.28G/4.98G [00:44<00:44, 60.7MB/s]\u001b[A\n",
727
- "\n",
728
- "model-00002-of-00003.safetensors: 51%|█████ | 2.55G/4.98G [00:44<00:48, 49.9MB/s]\u001b[A\u001b[A\n",
729
- "model-00001-of-00003.safetensors: 46%|████▌ | 2.30G/4.98G [00:45<00:47, 57.0MB/s]\u001b[A\n",
730
- "\n",
731
- "model-00002-of-00003.safetensors: 52%|█████▏ | 2.57G/4.98G [00:45<00:43, 55.7MB/s]\u001b[A\u001b[A\n",
732
- "\n",
733
- "model-00002-of-00003.safetensors: 52%|█████▏ | 2.58G/4.98G [00:45<00:51, 47.0MB/s]\u001b[A\u001b[A\n",
734
- "model-00001-of-00003.safetensors: 46%|████▋ | 2.31G/4.98G [00:45<01:03, 42.0MB/s]\u001b[A\n",
735
- "\n",
736
- "model-00002-of-00003.safetensors: 52%|█████▏ | 2.60G/4.98G [00:45<00:45, 52.8MB/s]\u001b[A\u001b[A\n",
737
- "\n",
738
- "model-00002-of-00003.safetensors: 52%|█████▏ | 2.61G/4.98G [00:45<00:43, 54.3MB/s]\u001b[A\u001b[A\n",
739
- "model-00001-of-00003.safetensors: 47%|████▋ | 2.33G/4.98G [00:46<01:11, 37.3MB/s]\u001b[A\n",
740
- "\n",
741
- "model-00002-of-00003.safetensors: 53%|█████▎ | 2.62G/4.98G [00:46<00:48, 49.0MB/s]\u001b[A\u001b[A\n",
742
- "\n",
743
- "model-00002-of-00003.safetensors: 53%|█████▎ | 2.63G/4.98G [00:46<00:44, 52.7MB/s]\u001b[A\u001b[A\n",
744
- "model-00001-of-00003.safetensors: 47%|████▋ | 2.34G/4.98G [00:46<01:08, 38.5MB/s]\u001b[A\n",
745
- "\n",
746
- "model-00002-of-00003.safetensors: 53%|█████▎ | 2.64G/4.98G [00:46<00:43, 53.8MB/s]\u001b[A\u001b[A\n",
747
- "model-00001-of-00003.safetensors: 47%|████▋ | 2.36G/4.98G [00:46<00:54, 47.9MB/s]\u001b[A\n",
748
- "\n",
749
- "model-00002-of-00003.safetensors: 53%|█████▎ | 2.66G/4.98G [00:46<00:38, 60.6MB/s]\u001b[A\u001b[A\n",
750
- "\n",
751
- "model-00002-of-00003.safetensors: 54%|█████▎ | 2.67G/4.98G [00:46<00:35, 64.7MB/s]\u001b[A\u001b[A\n",
752
- "model-00001-of-00003.safetensors: 48%|████▊ | 2.37G/4.98G [00:47<01:00, 43.5MB/s]\u001b[A\n",
753
- "\n",
754
- "model-00002-of-00003.safetensors: 54%|█████▍ | 2.69G/4.98G [00:47<00:33, 69.1MB/s]\u001b[A\u001b[A\n",
755
- "model-00001-of-00003.safetensors: 48%|████▊ | 2.39G/4.98G [00:47<00:53, 48.6MB/s]\u001b[A\n",
756
- "model-00001-of-00003.safetensors: 48%|████▊ | 2.40G/4.98G [00:47<00:54, 47.7MB/s]\u001b[A\n",
757
- "\n",
758
- "model-00002-of-00003.safetensors: 54%|█████▍ | 2.71G/4.98G [00:47<00:43, 52.8MB/s]\u001b[A\u001b[A\n",
759
- "model-00001-of-00003.safetensors: 49%|████▊ | 2.42G/4.98G [00:47<00:44, 57.3MB/s]\u001b[A\n",
760
- "\n",
761
- "model-00002-of-00003.safetensors: 55%|█████▍ | 2.73G/4.98G [00:47<00:36, 61.5MB/s]\u001b[A\u001b[A\n",
762
- "model-00001-of-00003.safetensors: 49%|████▉ | 2.43G/4.98G [00:48<00:41, 61.0MB/s]\u001b[A\n",
763
- "\n",
764
- "model-00002-of-00003.safetensors: 55%|█████▍ | 2.74G/4.98G [00:48<00:40, 55.6MB/s]\u001b[A\u001b[A\n",
765
- "model-00001-of-00003.safetensors: 49%|████▉ | 2.45G/4.98G [00:48<00:43, 58.5MB/s]\u001b[A\n",
766
- "\n",
767
- "model-00002-of-00003.safetensors: 55%|█████▌ | 2.76G/4.98G [00:48<00:40, 54.7MB/s]\u001b[A\u001b[A\n",
768
- "model-00001-of-00003.safetensors: 49%|████▉ | 2.46G/4.98G [00:48<00:51, 49.0MB/s]\u001b[A\n",
769
- "\n",
770
- "model-00002-of-00003.safetensors: 56%|█████▌ | 2.77G/4.98G [00:48<00:42, 51.6MB/s]\u001b[A\u001b[A\n",
771
- "\n",
772
- "model-00002-of-00003.safetensors: 56%|█████▌ | 2.79G/4.98G [00:48<00:34, 63.3MB/s]\u001b[A\u001b[A\n",
773
- "model-00001-of-00003.safetensors: 50%|████▉ | 2.49G/4.98G [00:49<00:47, 52.7MB/s]\u001b[A\n",
774
- "model-00001-of-00003.safetensors: 50%|█████ | 2.50G/4.98G [00:49<00:51, 48.1MB/s]\u001b[A\n",
775
- "\n",
776
- "model-00002-of-00003.safetensors: 56%|█████▌ | 2.80G/4.98G [00:49<00:44, 49.5MB/s]\u001b[A\u001b[A\n",
777
- "\n",
778
- "model-00002-of-00003.safetensors: 56%|█████▋ | 2.81G/4.98G [00:49<00:40, 53.5MB/s]\u001b[A\u001b[A\n",
779
- "model-00001-of-00003.safetensors: 50%|█████ | 2.51G/4.98G [00:49<00:48, 51.1MB/s]\u001b[A\n",
780
- "model-00001-of-00003.safetensors: 51%|█████ | 2.52G/4.98G [00:49<00:45, 54.7MB/s]\u001b[A\n",
781
- "\n",
782
- "model-00002-of-00003.safetensors: 57%|█████▋ | 2.82G/4.98G [00:49<00:39, 55.4MB/s]\u001b[A\u001b[A\n",
783
- "model-00001-of-00003.safetensors: 51%|█████ | 2.54G/4.98G [00:50<00:41, 58.9MB/s]\u001b[A\n",
784
- "\n",
785
- "model-00002-of-00003.safetensors: 57%|█████▋ | 2.84G/4.98G [00:50<00:42, 50.6MB/s]\u001b[A\u001b[A\n",
786
- "\n",
787
- "model-00002-of-00003.safetensors: 57%|█████▋ | 2.85G/4.98G [00:50<00:44, 47.9MB/s]\u001b[A\u001b[A\n",
788
- "model-00001-of-00003.safetensors: 51%|█████ | 2.55G/4.98G [00:50<00:54, 44.4MB/s]\u001b[A\n",
789
- "model-00001-of-00003.safetensors: 52%|█████▏ | 2.57G/4.98G [00:50<00:43, 55.0MB/s]\u001b[A\n",
790
- "model-00001-of-00003.safetensors: 52%|█████▏ | 2.58G/4.98G [00:50<00:44, 53.7MB/s]\u001b[A\n",
791
- "\n",
792
- "model-00002-of-00003.safetensors: 58%|█████▊ | 2.87G/4.98G [00:50<00:49, 42.3MB/s]\u001b[A\u001b[A\n",
793
- "\n",
794
- "model-00002-of-00003.safetensors: 58%|█████▊ | 2.89G/4.98G [00:51<00:35, 58.2MB/s]\u001b[A\u001b[A\n",
795
- "model-00001-of-00003.safetensors: 52%|█████▏ | 2.60G/4.98G [00:51<00:44, 54.0MB/s]\u001b[A\n",
796
- "\n",
797
- "model-00002-of-00003.safetensors: 58%|█████▊ | 2.90G/4.98G [00:51<00:43, 47.9MB/s]\u001b[A\u001b[A\n",
798
- "model-00001-of-00003.safetensors: 52%|█████▏ | 2.61G/4.98G [00:51<00:45, 51.7MB/s]\u001b[A\n",
799
- "\n",
800
- "model-00002-of-00003.safetensors: 59%|█████▊ | 2.92G/4.98G [00:51<00:41, 49.8MB/s]\u001b[A\u001b[A\n",
801
- "model-00001-of-00003.safetensors: 53%|█████▎ | 2.63G/4.98G [00:51<00:43, 54.6MB/s]\u001b[A\n",
802
- "\n",
803
- "model-00002-of-00003.safetensors: 59%|█████▉ | 2.94G/4.98G [00:51<00:32, 62.3MB/s]\u001b[A\u001b[A\n",
804
- "model-00001-of-00003.safetensors: 53%|█████▎ | 2.64G/4.98G [00:52<00:40, 57.5MB/s]\u001b[A\n",
805
- "\n",
806
- "model-00002-of-00003.safetensors: 59%|█████▉ | 2.95G/4.98G [00:52<00:37, 54.4MB/s]\u001b[A\u001b[A\n",
807
- "model-00001-of-00003.safetensors: 53%|█████▎ | 2.65G/4.98G [00:52<00:47, 49.0MB/s]\u001b[A\n",
808
- "model-00001-of-00003.safetensors: 53%|█████▎ | 2.66G/4.98G [00:52<00:42, 54.4MB/s]\u001b[A\n",
809
- "\n",
810
- "model-00002-of-00003.safetensors: 60%|█████▉ | 2.97G/4.98G [00:52<00:38, 52.1MB/s]\u001b[A\u001b[A\n",
811
- "model-00001-of-00003.safetensors: 54%|█████▎ | 2.67G/4.98G [00:52<00:48, 47.1MB/s]\u001b[A\n",
812
- "\n",
813
- "model-00002-of-00003.safetensors: 60%|█████▉ | 2.98G/4.98G [00:52<00:38, 51.6MB/s]\u001b[A\u001b[A\n",
814
- "model-00001-of-00003.safetensors: 54%|█████▍ | 2.69G/4.98G [00:53<00:39, 57.3MB/s]\u001b[A\n",
815
- "model-00001-of-00003.safetensors: 54%|█████▍ | 2.71G/4.98G [00:53<00:42, 53.5MB/s]\u001b[A\n",
816
- "\n",
817
- "model-00002-of-00003.safetensors: 60%|█████▉ | 2.99G/4.98G [00:53<00:53, 37.6MB/s]\u001b[A\u001b[A\n",
818
- "model-00001-of-00003.safetensors: 55%|█████▍ | 2.73G/4.98G [00:53<00:40, 55.8MB/s]\u001b[A\n",
819
- "model-00001-of-00003.safetensors: 55%|█████▍ | 2.74G/4.98G [00:53<00:38, 58.2MB/s]\u001b[A\n",
820
- "\n",
821
- "model-00002-of-00003.safetensors: 60%|██████ | 3.00G/4.98G [00:54<01:15, 26.3MB/s]\u001b[A\u001b[A\n",
822
- "model-00001-of-00003.safetensors: 55%|█████▌ | 2.76G/4.98G [00:54<00:36, 60.6MB/s]\u001b[A\n",
823
- "\n",
824
- "model-00002-of-00003.safetensors: 60%|██████ | 3.01G/4.98G [00:54<01:00, 32.5MB/s]\u001b[A\u001b[A\n",
825
- "model-00001-of-00003.safetensors: 56%|█████▌ | 2.77G/4.98G [00:54<00:39, 55.8MB/s]\u001b[A\n",
826
- "model-00001-of-00003.safetensors: 56%|█████▌ | 2.79G/4.98G [00:54<00:31, 68.8MB/s]\u001b[A\n",
827
- "\n",
828
- "model-00002-of-00003.safetensors: 61%|██████ | 3.03G/4.98G [00:54<00:47, 40.9MB/s]\u001b[A\u001b[A\n",
829
- "model-00001-of-00003.safetensors: 56%|█████▌ | 2.80G/4.98G [00:54<00:33, 65.2MB/s]\u001b[A\n",
830
- "model-00001-of-00003.safetensors: 56%|█████▋ | 2.81G/4.98G [00:54<00:34, 63.7MB/s]\u001b[A\n",
831
- "model-00001-of-00003.safetensors: 57%|█████▋ | 2.82G/4.98G [00:55<00:32, 66.4MB/s]\u001b[A\n",
832
- "\n",
833
- "model-00002-of-00003.safetensors: 61%|██████ | 3.04G/4.98G [00:55<01:01, 31.4MB/s]\u001b[A\u001b[A\n",
834
- "model-00001-of-00003.safetensors: 57%|█████▋ | 2.84G/4.98G [00:55<00:30, 70.3MB/s]\u001b[A\n",
835
- "\n",
836
- "model-00002-of-00003.safetensors: 61%|██████▏ | 3.06G/4.98G [00:55<00:43, 44.0MB/s]\u001b[A\u001b[A\n",
837
- "model-00001-of-00003.safetensors: 57%|█████▋ | 2.85G/4.98G [00:55<00:35, 60.6MB/s]\u001b[A\n",
838
- "\n",
839
- "model-00002-of-00003.safetensors: 62%|██████▏ | 3.07G/4.98G [00:55<00:50, 38.0MB/s]\u001b[A\u001b[A\n",
840
- "model-00001-of-00003.safetensors: 58%|█████▊ | 2.87G/4.98G [00:55<00:33, 63.4MB/s]\u001b[A\n",
841
- "\n",
842
- "model-00002-of-00003.safetensors: 62%|██████▏ | 3.08G/4.98G [00:55<00:44, 42.3MB/s]\u001b[A\u001b[A\n",
843
- "model-00001-of-00003.safetensors: 58%|█████▊ | 2.88G/4.98G [00:55<00:30, 68.2MB/s]\u001b[A\n",
844
- "\n",
845
- "model-00002-of-00003.safetensors: 62%|██████▏ | 3.09G/4.98G [00:55<00:39, 47.7MB/s]\u001b[A\u001b[A\n",
846
- "\n",
847
- "model-00002-of-00003.safetensors: 62%|██████▏ | 3.10G/4.98G [00:56<00:34, 54.4MB/s]\u001b[A\u001b[A\n",
848
- "model-00001-of-00003.safetensors: 58%|█████▊ | 2.90G/4.98G [00:56<00:27, 76.3MB/s]\u001b[A\n",
849
- "\n",
850
- "model-00002-of-00003.safetensors: 63%|██████▎ | 3.11G/4.98G [00:56<00:34, 54.1MB/s]\u001b[A\u001b[A\n",
851
- "model-00001-of-00003.safetensors: 59%|█████▊ | 2.92G/4.98G [00:56<00:31, 66.5MB/s]\u001b[A\n",
852
- "\n",
853
- "model-00002-of-00003.safetensors: 63%|██████▎ | 3.12G/4.98G [00:56<00:31, 59.4MB/s]\u001b[A\u001b[A\n",
854
- "\n",
855
- "model-00002-of-00003.safetensors: 63%|██████▎ | 3.15G/4.98G [00:56<00:29, 62.9MB/s]\u001b[A\u001b[A\n",
856
- "\n",
857
- "model-00002-of-00003.safetensors: 64%|██████▎ | 3.17G/4.98G [00:56<00:22, 82.3MB/s]\u001b[A\u001b[A\n",
858
- "model-00001-of-00003.safetensors: 59%|█████▉ | 2.94G/4.98G [00:56<00:37, 54.7MB/s]\u001b[A\n",
859
- "\n",
860
- "model-00002-of-00003.safetensors: 64%|██████▍ | 3.18G/4.98G [00:56<00:21, 85.1MB/s]\u001b[A\u001b[A\n",
861
- "model-00001-of-00003.safetensors: 59%|█████▉ | 2.95G/4.98G [00:57<00:35, 57.5MB/s]\u001b[A\n",
862
- "\n",
863
- "model-00002-of-00003.safetensors: 64%|██████▍ | 3.19G/4.98G [00:57<00:20, 87.9MB/s]\u001b[A\u001b[A\n",
864
- "model-00001-of-00003.safetensors: 60%|█████▉ | 2.97G/4.98G [00:57<00:34, 58.6MB/s]\u001b[A\n",
865
- "\n",
866
- "model-00002-of-00003.safetensors: 64%|██████▍ | 3.21G/4.98G [00:57<00:23, 76.9MB/s]\u001b[A\u001b[A\n",
867
- "model-00001-of-00003.safetensors: 60%|█████▉ | 2.98G/4.98G [00:57<00:35, 55.8MB/s]\u001b[A\n",
868
- "\n",
869
- "model-00002-of-00003.safetensors: 65%|██████▍ | 3.22G/4.98G [00:57<00:27, 64.2MB/s]\u001b[A\u001b[A\n",
870
- "\n",
871
- "model-00002-of-00003.safetensors: 65%|██████▍ | 3.23G/4.98G [00:57<00:26, 66.6MB/s]\u001b[A\u001b[A\n",
872
- "\n",
873
- "model-00002-of-00003.safetensors: 65%|██████▌ | 3.24G/4.98G [00:57<00:27, 62.3MB/s]\u001b[A\u001b[A\n",
874
- "model-00001-of-00003.safetensors: 60%|██████ | 3.00G/4.98G [00:58<00:39, 49.9MB/s]\u001b[A\n",
875
- "\n",
876
- "model-00002-of-00003.safetensors: 65%|██████▌ | 3.25G/4.98G [00:58<00:35, 48.5MB/s]\u001b[A\u001b[A\n",
877
- "model-00001-of-00003.safetensors: 60%|██████ | 3.01G/4.98G [00:58<00:42, 46.5MB/s]\u001b[A\n",
878
- "\n",
879
- "model-00002-of-00003.safetensors: 65%|██████▌ | 3.26G/4.98G [00:58<00:45, 38.2MB/s]\u001b[A\u001b[A\n",
880
- "model-00001-of-00003.safetensors: 61%|██████ | 3.03G/4.98G [00:58<00:40, 47.8MB/s]\u001b[A\n",
881
- "\n",
882
- "model-00002-of-00003.safetensors: 66%|██████▌ | 3.27G/4.98G [00:59<00:49, 34.8MB/s]\u001b[A\u001b[A\n",
883
- "model-00001-of-00003.safetensors: 61%|██████ | 3.04G/4.98G [00:59<00:50, 38.8MB/s]\u001b[A\n",
884
- "\n",
885
- "model-00002-of-00003.safetensors: 66%|██████▌ | 3.28G/4.98G [00:59<00:48, 34.7MB/s]\u001b[A\u001b[A\n",
886
- "model-00001-of-00003.safetensors: 61%|██████ | 3.05G/4.98G [00:59<00:56, 34.3MB/s]\u001b[A\n",
887
- "\n",
888
- "model-00002-of-00003.safetensors: 66%|██████▋ | 3.30G/4.98G [00:59<00:39, 42.6MB/s]\u001b[A\u001b[A\n",
889
- "model-00001-of-00003.safetensors: 61%|██████▏ | 3.06G/4.98G [00:59<00:49, 38.9MB/s]\u001b[A\n",
890
- "model-00001-of-00003.safetensors: 62%|██████▏ | 3.07G/4.98G [01:00<00:45, 41.8MB/s]\u001b[A\n",
891
- "\n",
892
- "model-00002-of-00003.safetensors: 67%|██████▋ | 3.31G/4.98G [01:00<00:40, 41.3MB/s]\u001b[A\u001b[A\n",
893
- "\n",
894
- "model-00002-of-00003.safetensors: 67%|██████▋ | 3.33G/4.98G [01:00<00:30, 54.2MB/s]\u001b[A\u001b[A\n",
895
- "\n",
896
- "model-00002-of-00003.safetensors: 67%|██████▋ | 3.34G/4.98G [01:00<00:29, 54.8MB/s]\u001b[A\u001b[A\n",
897
- "model-00001-of-00003.safetensors: 62%|██████▏ | 3.09G/4.98G [01:00<00:47, 39.6MB/s]\u001b[A\n",
898
- "\n",
899
- "model-00002-of-00003.safetensors: 68%|██████▊ | 3.37G/4.98G [01:00<00:26, 61.1MB/s]\u001b[A\u001b[A\n",
900
- "model-00001-of-00003.safetensors: 63%|██████▎ | 3.11G/4.98G [01:00<00:37, 50.2MB/s]\u001b[A\n",
901
- "\n",
902
- "model-00002-of-00003.safetensors: 68%|██████▊ | 3.39G/4.98G [01:00<00:20, 79.3MB/s]\u001b[A\u001b[A\n",
903
- "\n",
904
- "model-00002-of-00003.safetensors: 68%|██████▊ | 3.40G/4.98G [01:01<00:20, 76.9MB/s]\u001b[A\u001b[A\n",
905
- "model-00001-of-00003.safetensors: 63%|██████▎ | 3.12G/4.98G [01:01<00:37, 49.1MB/s]\u001b[A\n",
906
- "model-00001-of-00003.safetensors: 63%|██████▎ | 3.14G/4.98G [01:01<00:33, 55.2MB/s]\u001b[A\n",
907
- "\n",
908
- "model-00002-of-00003.safetensors: 69%|██████▊ | 3.42G/4.98G [01:01<00:18, 82.6MB/s]\u001b[A\u001b[A\n",
909
- "model-00001-of-00003.safetensors: 63%|██████▎ | 3.15G/4.98G [01:01<00:40, 45.3MB/s]\u001b[A\n",
910
- "\n",
911
- "model-00002-of-00003.safetensors: 69%|██████▉ | 3.43G/4.98G [01:01<00:24, 63.2MB/s]\u001b[A\u001b[A\n",
912
- "model-00001-of-00003.safetensors: 63%|██████▎ | 3.16G/4.98G [01:01<00:37, 48.3MB/s]\u001b[A\n",
913
- "\n",
914
- "model-00002-of-00003.safetensors: 69%|██████▉ | 3.45G/4.98G [01:01<00:21, 69.7MB/s]\u001b[A\u001b[A\n",
915
- "model-00001-of-00003.safetensors: 64%|██████▍ | 3.18G/4.98G [01:02<00:32, 56.1MB/s]\u001b[A\n",
916
- "\n",
917
- "model-00002-of-00003.safetensors: 69%|██████▉ | 3.46G/4.98G [01:02<00:25, 58.6MB/s]\u001b[A\u001b[A\n",
918
- "model-00001-of-00003.safetensors: 64%|██████▍ | 3.19G/4.98G [01:02<00:32, 55.5MB/s]\u001b[A\n",
919
- "\n",
920
- "model-00002-of-00003.safetensors: 70%|██████▉ | 3.47G/4.98G [01:02<00:27, 55.6MB/s]\u001b[A\u001b[A\n",
921
- "model-00001-of-00003.safetensors: 64%|██████▍ | 3.20G/4.98G [01:02<00:30, 57.7MB/s]\u001b[A\n",
922
- "model-00001-of-00003.safetensors: 64%|██████▍ | 3.21G/4.98G [01:02<00:31, 57.2MB/s]\u001b[A\n",
923
- "\n",
924
- "model-00002-of-00003.safetensors: 70%|██████▉ | 3.48G/4.98G [01:02<00:29, 50.2MB/s]\u001b[A\u001b[A\n",
925
- "model-00001-of-00003.safetensors: 65%|██████▍ | 3.22G/4.98G [01:02<00:28, 61.9MB/s]\u001b[A\n",
926
- "model-00001-of-00003.safetensors: 65%|██████▌ | 3.24G/4.98G [01:03<00:26, 64.7MB/s]\u001b[A\n",
927
- "\n",
928
- "model-00002-of-00003.safetensors: 70%|███████ | 3.49G/4.98G [01:02<00:37, 40.0MB/s]\u001b[A\u001b[A\n",
929
- "model-00001-of-00003.safetensors: 65%|██████▌ | 3.25G/4.98G [01:03<00:25, 68.5MB/s]\u001b[A\n",
930
- "\n",
931
- "model-00002-of-00003.safetensors: 71%|███████ | 3.51G/4.98G [01:03<00:26, 54.8MB/s]\u001b[A\u001b[A\n",
932
- "model-00001-of-00003.safetensors: 66%|██████▌ | 3.27G/4.98G [01:03<00:20, 83.3MB/s]\u001b[A\n",
933
- "\n",
934
- "model-00002-of-00003.safetensors: 71%|███████ | 3.52G/4.98G [01:03<00:27, 52.4MB/s]\u001b[A\u001b[A\n",
935
- "model-00001-of-00003.safetensors: 66%|██████▌ | 3.28G/4.98G [01:03<00:23, 72.0MB/s]\u001b[A\n",
936
- "model-00001-of-00003.safetensors: 66%|██████▋ | 3.30G/4.98G [01:03<00:20, 81.1MB/s]\u001b[A\n",
937
- "\n",
938
- "model-00002-of-00003.safetensors: 71%|███████ | 3.54G/4.98G [01:03<00:25, 55.9MB/s]\u001b[A\u001b[A\n",
939
- "model-00001-of-00003.safetensors: 67%|██████▋ | 3.31G/4.98G [01:03<00:23, 71.8MB/s]\u001b[A\n",
940
- "model-00001-of-00003.safetensors: 67%|██████▋ | 3.33G/4.98G [01:04<00:21, 76.1MB/s]\u001b[A\n",
941
- "\n",
942
- "model-00002-of-00003.safetensors: 71%|███████▏ | 3.55G/4.98G [01:04<00:32, 44.5MB/s]\u001b[A\u001b[A\n",
943
- "\n",
944
- "model-00002-of-00003.safetensors: 72%|███████▏ | 3.57G/4.98G [01:04<00:29, 47.3MB/s]\u001b[A\u001b[A\n",
945
- "model-00001-of-00003.safetensors: 67%|██████▋ | 3.34G/4.98G [01:04<00:25, 63.2MB/s]\u001b[A\n",
946
- "\n",
947
- "model-00002-of-00003.safetensors: 72%|███████▏ | 3.58G/4.98G [01:04<00:27, 51.8MB/s]\u001b[A\u001b[A\n",
948
- "\n",
949
- "model-00002-of-00003.safetensors: 72%|███████▏ | 3.59G/4.98G [01:04<00:26, 53.2MB/s]\u001b[A\u001b[A\n",
950
- "model-00001-of-00003.safetensors: 68%|██████▊ | 3.37G/4.98G [01:04<00:24, 66.1MB/s]\u001b[A\n",
951
- "\n",
952
- "model-00002-of-00003.safetensors: 72%|███████▏ | 3.60G/4.98G [01:04<00:27, 50.6MB/s]\u001b[A\u001b[A\n",
953
- "model-00001-of-00003.safetensors: 68%|██████▊ | 3.38G/4.98G [01:04<00:26, 60.9MB/s]\u001b[A\n",
954
- "\n",
955
- "model-00002-of-00003.safetensors: 72%|███████▏ | 3.61G/4.98G [01:05<00:27, 50.8MB/s]\u001b[A\u001b[A\n",
956
- "model-00001-of-00003.safetensors: 68%|██████▊ | 3.40G/4.98G [01:05<00:30, 52.4MB/s]\u001b[A\n",
957
- "\n",
958
- "model-00002-of-00003.safetensors: 73%|███████▎ | 3.62G/4.98G [01:05<00:32, 41.8MB/s]\u001b[A\u001b[A\n",
959
- "model-00001-of-00003.safetensors: 68%|██████▊ | 3.41G/4.98G [01:05<00:32, 48.1MB/s]\u001b[A\n",
960
- "\n",
961
- "model-00002-of-00003.safetensors: 73%|███████▎ | 3.64G/4.98G [01:05<00:25, 52.3MB/s]\u001b[A\u001b[A\n",
962
- "model-00001-of-00003.safetensors: 69%|██████▊ | 3.42G/4.98G [01:05<00:31, 50.3MB/s]\u001b[A\n",
963
- "\n",
964
- "model-00002-of-00003.safetensors: 73%|███████▎ | 3.65G/4.98G [01:05<00:26, 50.8MB/s]\u001b[A\u001b[A\n",
965
- "model-00001-of-00003.safetensors: 69%|██████▉ | 3.43G/4.98G [01:06<00:36, 42.9MB/s]\u001b[A\n",
966
- "\n",
967
- "model-00002-of-00003.safetensors: 74%|███████▎ | 3.67G/4.98G [01:06<00:23, 55.1MB/s]\u001b[A\u001b[A\n",
968
- "model-00001-of-00003.safetensors: 69%|██████▉ | 3.45G/4.98G [01:06<00:26, 58.5MB/s]\u001b[A\n",
969
- "\n",
970
- "model-00002-of-00003.safetensors: 74%|███████▍ | 3.68G/4.98G [01:06<00:26, 48.4MB/s]\u001b[A\u001b[A\n",
971
- "model-00001-of-00003.safetensors: 69%|██████▉ | 3.46G/4.98G [01:06<00:26, 56.4MB/s]\u001b[A\n",
972
- "model-00001-of-00003.safetensors: 70%|██████▉ | 3.47G/4.98G [01:06<00:25, 59.9MB/s]\u001b[A\n",
973
- "\n",
974
- "model-00002-of-00003.safetensors: 74%|███████▍ | 3.70G/4.98G [01:06<00:23, 55.0MB/s]\u001b[A\u001b[A\n",
975
- "model-00001-of-00003.safetensors: 70%|██████▉ | 3.48G/4.98G [01:07<00:28, 52.7MB/s]\u001b[A\n",
976
- "\n",
977
- "model-00002-of-00003.safetensors: 74%|███████▍ | 3.71G/4.98G [01:07<00:24, 52.0MB/s]\u001b[A\u001b[A\n",
978
- "\n",
979
- "model-00002-of-00003.safetensors: 75%|███████▍ | 3.72G/4.98G [01:07<00:22, 55.7MB/s]\u001b[A\u001b[A\n",
980
- "model-00001-of-00003.safetensors: 70%|███████ | 3.49G/4.98G [01:07<00:40, 36.7MB/s]\u001b[A\n",
981
- "\n",
982
- "model-00002-of-00003.safetensors: 75%|███████▍ | 3.73G/4.98G [01:07<00:25, 49.0MB/s]\u001b[A\u001b[A\n",
983
- "\n",
984
- "model-00002-of-00003.safetensors: 75%|███████▌ | 3.74G/4.98G [01:07<00:24, 51.3MB/s]\u001b[A\u001b[A\n",
985
- "model-00001-of-00003.safetensors: 71%|███████ | 3.51G/4.98G [01:07<00:33, 43.3MB/s]\u001b[A\n",
986
- "\n",
987
- "model-00002-of-00003.safetensors: 75%|███████▌ | 3.75G/4.98G [01:07<00:24, 50.2MB/s]\u001b[A\u001b[A\n",
988
- "\n",
989
- "model-00002-of-00003.safetensors: 76%|███████▌ | 3.76G/4.98G [01:08<00:21, 55.6MB/s]\u001b[A\u001b[A\n",
990
- "model-00001-of-00003.safetensors: 71%|███████ | 3.52G/4.98G [01:08<00:33, 44.0MB/s]\u001b[A\n",
991
- "model-00001-of-00003.safetensors: 71%|███████ | 3.54G/4.98G [01:08<00:28, 50.8MB/s]\u001b[A\n",
992
- "\n",
993
- "model-00002-of-00003.safetensors: 76%|███████▌ | 3.79G/4.98G [01:08<00:23, 50.9MB/s]\u001b[A\u001b[A\n",
994
- "\n",
995
- "model-00002-of-00003.safetensors: 76%|███████▌ | 3.80G/4.98G [01:08<00:24, 48.8MB/s]\u001b[A\u001b[A\n",
996
- "model-00001-of-00003.safetensors: 71%|███████▏ | 3.55G/4.98G [01:09<00:37, 38.3MB/s]\u001b[A\n",
997
- "\n",
998
- "model-00002-of-00003.safetensors: 77%|███████▋ | 3.82G/4.98G [01:09<00:18, 62.7MB/s]\u001b[A\u001b[A\n",
999
- "model-00001-of-00003.safetensors: 72%|███████▏ | 3.57G/4.98G [01:09<00:32, 43.8MB/s]\u001b[A\n",
1000
- "\n",
1001
- "model-00002-of-00003.safetensors: 77%|███████▋ | 3.83G/4.98G [01:09<00:19, 58.1MB/s]\u001b[A\u001b[A\n",
1002
- "model-00001-of-00003.safetensors: 72%|███████▏ | 3.58G/4.98G [01:09<00:31, 44.2MB/s]\u001b[A\n",
1003
- "model-00001-of-00003.safetensors: 72%|███████▏ | 3.59G/4.98G [01:09<00:28, 49.5MB/s]\u001b[A\n",
1004
- "\n",
1005
- "model-00002-of-00003.safetensors: 77%|███████▋ | 3.85G/4.98G [01:09<00:18, 59.8MB/s]\u001b[A\u001b[A\n",
1006
- "\n",
1007
- "model-00002-of-00003.safetensors: 77%|███████▋ | 3.86G/4.98G [01:09<00:22, 48.9MB/s]\u001b[A\u001b[A\n",
1008
- "model-00001-of-00003.safetensors: 72%|███████▏ | 3.61G/4.98G [01:10<00:32, 42.0MB/s]\u001b[A\n",
1009
- "\n",
1010
- "model-00002-of-00003.safetensors: 78%|███████▊ | 3.89G/4.98G [01:10<00:14, 73.6MB/s]\u001b[A\u001b[A\n",
1011
- "model-00001-of-00003.safetensors: 73%|███████▎ | 3.62G/4.98G [01:10<00:34, 39.1MB/s]\u001b[A\n",
1012
- "\n",
1013
- "model-00002-of-00003.safetensors: 78%|███████▊ | 3.91G/4.98G [01:10<00:16, 64.8MB/s]\u001b[A\u001b[A\n",
1014
- "\n",
1015
- "model-00002-of-00003.safetensors: 79%|███████▊ | 3.92G/4.98G [01:10<00:17, 61.5MB/s]\u001b[A\u001b[A\n",
1016
- "model-00001-of-00003.safetensors: 73%|███████▎ | 3.64G/4.98G [01:10<00:30, 44.2MB/s]\u001b[A\n",
1017
- "model-00001-of-00003.safetensors: 73%|███████▎ | 3.65G/4.98G [01:11<00:30, 43.3MB/s]\u001b[A\n",
1018
- "\n",
1019
- "model-00002-of-00003.safetensors: 79%|███████▉ | 3.94G/4.98G [01:11<00:18, 56.2MB/s]\u001b[A\u001b[A\n",
1020
- "\n",
1021
- "model-00002-of-00003.safetensors: 79%|███████▉ | 3.95G/4.98G [01:11<00:18, 56.3MB/s]\u001b[A\u001b[A\n",
1022
- "\n",
1023
- "model-00002-of-00003.safetensors: 80%|███████▉ | 3.97G/4.98G [01:11<00:15, 64.8MB/s]\u001b[A\u001b[A\n",
1024
- "model-00001-of-00003.safetensors: 74%|███████▎ | 3.67G/4.98G [01:11<00:32, 40.7MB/s]\u001b[A\n",
1025
- "model-00001-of-00003.safetensors: 74%|███████▍ | 3.70G/4.98G [01:11<00:21, 60.4MB/s]\u001b[A\n",
1026
- "model-00001-of-00003.safetensors: 75%|███████▍ | 3.71G/4.98G [01:12<00:20, 61.7MB/s]\u001b[A\n",
1027
- "\n",
1028
- "model-00002-of-00003.safetensors: 80%|███████▉ | 3.98G/4.98G [01:11<00:19, 50.4MB/s]\u001b[A\u001b[A\n",
1029
- "\n",
1030
- "model-00002-of-00003.safetensors: 80%|████████ | 4.01G/4.98G [01:12<00:18, 52.7MB/s]\u001b[A\u001b[A\n",
1031
- "model-00001-of-00003.safetensors: 75%|███████▍ | 3.72G/4.98G [01:12<00:30, 41.2MB/s]\u001b[A\n",
1032
- "\n",
1033
- "model-00002-of-00003.safetensors: 81%|████████ | 4.02G/4.98G [01:12<00:19, 48.9MB/s]\u001b[A\u001b[A\n",
1034
- "model-00001-of-00003.safetensors: 75%|███████▍ | 3.73G/4.98G [01:12<00:32, 38.7MB/s]\u001b[A\n",
1035
- "\n",
1036
- "model-00002-of-00003.safetensors: 81%|████████ | 4.04G/4.98G [01:13<00:18, 49.8MB/s]\u001b[A\u001b[A\n",
1037
- "model-00001-of-00003.safetensors: 75%|███████▌ | 3.75G/4.98G [01:13<00:23, 51.9MB/s]\u001b[A\n",
1038
- "model-00001-of-00003.safetensors: 76%|███████▌ | 3.76G/4.98G [01:13<00:22, 55.1MB/s]\u001b[A\n",
1039
- "\n",
1040
- "model-00002-of-00003.safetensors: 81%|████████▏ | 4.06G/4.98G [01:13<00:15, 60.3MB/s]\u001b[A\u001b[A\n",
1041
- "\n",
1042
- "model-00002-of-00003.safetensors: 82%|████████▏ | 4.07G/4.98G [01:13<00:17, 52.9MB/s]\u001b[A\u001b[A\n",
1043
- "model-00001-of-00003.safetensors: 76%|███████▌ | 3.79G/4.98G [01:13<00:20, 58.7MB/s]\u001b[A\n",
1044
- "model-00001-of-00003.safetensors: 76%|███████▌ | 3.80G/4.98G [01:13<00:21, 55.7MB/s]\u001b[A\n",
1045
- "\n",
1046
- "model-00002-of-00003.safetensors: 82%|████████▏ | 4.09G/4.98G [01:13<00:14, 60.8MB/s]\u001b[A\u001b[A\n",
1047
- "model-00001-of-00003.safetensors: 76%|███████▋ | 3.81G/4.98G [01:13<00:19, 60.4MB/s]\u001b[A\n",
1048
- "model-00001-of-00003.safetensors: 77%|███████▋ | 3.82G/4.98G [01:14<00:18, 62.2MB/s]\u001b[A\n",
1049
- "\n",
1050
- "model-00002-of-00003.safetensors: 82%|████████▏ | 4.10G/4.98G [01:14<00:16, 54.3MB/s]\u001b[A\u001b[A\n",
1051
- "\n",
1052
- "model-00002-of-00003.safetensors: 83%|████████▎ | 4.12G/4.98G [01:14<00:13, 65.5MB/s]\u001b[A\u001b[A\n",
1053
- "model-00001-of-00003.safetensors: 77%|███████▋ | 3.83G/4.98G [01:14<00:25, 45.1MB/s]\u001b[A\n",
1054
- "\n",
1055
- "model-00002-of-00003.safetensors: 83%|████████▎ | 4.13G/4.98G [01:14<00:17, 49.4MB/s]\u001b[A\u001b[A\n",
1056
- "model-00001-of-00003.safetensors: 77%|███████▋ | 3.85G/4.98G [01:14<00:22, 51.0MB/s]\u001b[A\n",
1057
- "\n",
1058
- "model-00002-of-00003.safetensors: 83%|████████▎ | 4.14G/4.98G [01:14<00:16, 50.5MB/s]\u001b[A\u001b[A\n",
1059
- "model-00001-of-00003.safetensors: 77%|███████▋ | 3.86G/4.98G [01:15<00:22, 50.4MB/s]\u001b[A\n",
1060
- "\n",
1061
- "model-00002-of-00003.safetensors: 83%|████████▎ | 4.15G/4.98G [01:15<00:15, 52.9MB/s]\u001b[A\u001b[A\n",
1062
- "model-00001-of-00003.safetensors: 78%|███████▊ | 3.87G/4.98G [01:15<00:24, 46.1MB/s]\u001b[A\n",
1063
- "\n",
1064
- "model-00002-of-00003.safetensors: 84%|████████▎ | 4.16G/4.98G [01:15<00:17, 47.3MB/s]\u001b[A\u001b[A\n",
1065
- "model-00001-of-00003.safetensors: 78%|███████▊ | 3.88G/4.98G [01:15<00:21, 51.0MB/s]\u001b[A\n",
1066
- "\n",
1067
- "model-00002-of-00003.safetensors: 84%|████████▍ | 4.18G/4.98G [01:15<00:12, 66.2MB/s]\u001b[A\u001b[A\n",
1068
- "\n",
1069
- "model-00002-of-00003.safetensors: 84%|████████▍ | 4.19G/4.98G [01:15<00:13, 56.7MB/s]\u001b[A\u001b[A\n",
1070
- "model-00001-of-00003.safetensors: 78%|███████▊ | 3.89G/4.98G [01:15<00:24, 44.0MB/s]\u001b[A\n",
1071
- "\n",
1072
- "model-00002-of-00003.safetensors: 85%|████████▍ | 4.22G/4.98G [01:15<00:10, 73.9MB/s]\u001b[A\u001b[A\n",
1073
- "model-00001-of-00003.safetensors: 79%|███████▊ | 3.91G/4.98G [01:16<00:19, 55.8MB/s]\u001b[A\n",
1074
- "\n",
1075
- "model-00002-of-00003.safetensors: 85%|████████▍ | 4.23G/4.98G [01:16<00:10, 70.7MB/s]\u001b[A\u001b[A\n",
1076
- "model-00001-of-00003.safetensors: 79%|███████▊ | 3.92G/4.98G [01:16<00:20, 52.7MB/s]\u001b[A\n",
1077
- "model-00001-of-00003.safetensors: 79%|███████▉ | 3.93G/4.98G [01:16<00:18, 56.4MB/s]\u001b[A\n",
1078
- "model-00001-of-00003.safetensors: 79%|███████▉ | 3.94G/4.98G [01:16<00:19, 53.4MB/s]\u001b[A\n",
1079
- "\n",
1080
- "model-00002-of-00003.safetensors: 85%|████████▌ | 4.25G/4.98G [01:16<00:14, 51.4MB/s]\u001b[A\u001b[A\n",
1081
- "model-00001-of-00003.safetensors: 79%|███████▉ | 3.95G/4.98G [01:16<00:19, 52.9MB/s]\u001b[A\n",
1082
- "\n",
1083
- "model-00002-of-00003.safetensors: 85%|████████▌ | 4.26G/4.98G [01:16<00:15, 45.7MB/s]\u001b[A\u001b[A\n",
1084
- "model-00001-of-00003.safetensors: 80%|███████▉ | 3.97G/4.98G [01:17<00:18, 54.1MB/s]\u001b[A\n",
1085
- "\n",
1086
- "model-00002-of-00003.safetensors: 86%|████████▌ | 4.28G/4.98G [01:17<00:13, 50.8MB/s]\u001b[A\u001b[A\n",
1087
- "model-00001-of-00003.safetensors: 80%|███████▉ | 3.98G/4.98G [01:17<00:17, 55.7MB/s]\u001b[A\n",
1088
- "\n",
1089
- "model-00002-of-00003.safetensors: 86%|████████▌ | 4.29G/4.98G [01:17<00:14, 48.0MB/s]\u001b[A\u001b[A\n",
1090
- "model-00001-of-00003.safetensors: 80%|████████ | 4.01G/4.98G [01:17<00:14, 67.9MB/s]\u001b[A\n",
1091
- "model-00001-of-00003.safetensors: 81%|████████ | 4.02G/4.98G [01:17<00:14, 64.8MB/s]\u001b[A\n",
1092
- "\n",
1093
- "model-00002-of-00003.safetensors: 86%|████████▋ | 4.31G/4.98G [01:18<00:13, 49.0MB/s]\u001b[A\u001b[A\n",
1094
- "\n",
1095
- "model-00002-of-00003.safetensors: 87%|████████▋ | 4.32G/4.98G [01:18<00:13, 49.3MB/s]\u001b[A\u001b[A\n",
1096
- "model-00001-of-00003.safetensors: 81%|████████ | 4.04G/4.98G [01:18<00:17, 53.6MB/s]\u001b[A\n",
1097
- "\n",
1098
- "model-00002-of-00003.safetensors: 87%|████████▋ | 4.34G/4.98G [01:18<00:12, 49.4MB/s]\u001b[A\u001b[A\n",
1099
- "model-00001-of-00003.safetensors: 81%|████████ | 4.05G/4.98G [01:18<00:20, 45.0MB/s]\u001b[A\n",
1100
- "model-00001-of-00003.safetensors: 81%|████████▏ | 4.06G/4.98G [01:18<00:18, 49.4MB/s]\u001b[A\n",
1101
- "\n",
1102
- "model-00002-of-00003.safetensors: 88%|████████▊ | 4.36G/4.98G [01:18<00:11, 54.4MB/s]\u001b[A\u001b[A\n",
1103
- "model-00001-of-00003.safetensors: 82%|████████▏ | 4.07G/4.98G [01:19<00:20, 44.6MB/s]\u001b[A\n",
1104
- "\n",
1105
- "model-00002-of-00003.safetensors: 88%|████████▊ | 4.37G/4.98G [01:19<00:12, 49.8MB/s]\u001b[A\u001b[A\n",
1106
- "\n",
1107
- "model-00002-of-00003.safetensors: 88%|████████▊ | 4.38G/4.98G [01:19<00:11, 52.3MB/s]\u001b[A\u001b[A\n",
1108
- "model-00001-of-00003.safetensors: 82%|████████▏ | 4.09G/4.98G [01:19<00:20, 43.2MB/s]\u001b[A\n",
1109
- "\n",
1110
- "model-00002-of-00003.safetensors: 88%|████████▊ | 4.39G/4.98G [01:19<00:11, 51.8MB/s]\u001b[A\u001b[A\n",
1111
- "\n",
1112
- "model-00002-of-00003.safetensors: 88%|████████▊ | 4.40G/4.98G [01:19<00:11, 51.5MB/s]\u001b[A\u001b[A\n",
1113
- "\n",
1114
- "model-00002-of-00003.safetensors: 89%|████████▉ | 4.42G/4.98G [01:19<00:08, 67.1MB/s]\u001b[A\u001b[A\n",
1115
- "model-00001-of-00003.safetensors: 82%|████████▏ | 4.10G/4.98G [01:20<00:23, 37.3MB/s]\u001b[A\n",
1116
- "\n",
1117
- "model-00002-of-00003.safetensors: 89%|████████▉ | 4.44G/4.98G [01:20<00:09, 58.4MB/s]\u001b[A\u001b[A\n",
1118
- "\n",
1119
- "model-00002-of-00003.safetensors: 89%|████████▉ | 4.46G/4.98G [01:20<00:07, 71.1MB/s]\u001b[A\u001b[A\n",
1120
- "model-00001-of-00003.safetensors: 83%|████████▎ | 4.12G/4.98G [01:20<00:22, 39.0MB/s]\u001b[A\n",
1121
- "\n",
1122
- "model-00002-of-00003.safetensors: 90%|████████▉ | 4.47G/4.98G [01:20<00:07, 68.7MB/s]\u001b[A\u001b[A\n",
1123
- "model-00001-of-00003.safetensors: 83%|████████▎ | 4.13G/4.98G [01:20<00:19, 42.9MB/s]\u001b[A\n",
1124
- "\n",
1125
- "model-00002-of-00003.safetensors: 90%|████████▉ | 4.48G/4.98G [01:20<00:06, 73.3MB/s]\u001b[A\u001b[A\n",
1126
- "\n",
1127
- "model-00002-of-00003.safetensors: 90%|█████████ | 4.49G/4.98G [01:20<00:07, 69.2MB/s]\u001b[A\u001b[A\n",
1128
- "model-00001-of-00003.safetensors: 83%|████████▎ | 4.15G/4.98G [01:21<00:16, 50.1MB/s]\u001b[A\n",
1129
- "\n",
1130
- "model-00002-of-00003.safetensors: 90%|█████████ | 4.50G/4.98G [01:21<00:08, 56.6MB/s]\u001b[A\u001b[A\n",
1131
- "model-00001-of-00003.safetensors: 84%|████████▎ | 4.16G/4.98G [01:21<00:16, 48.6MB/s]\u001b[A\n",
1132
- "\n",
1133
- "model-00002-of-00003.safetensors: 91%|█████████ | 4.52G/4.98G [01:21<00:07, 62.4MB/s]\u001b[A\u001b[A\n",
1134
- "model-00001-of-00003.safetensors: 84%|████████▍ | 4.18G/4.98G [01:21<00:15, 52.0MB/s]\u001b[A\n",
1135
- "\n",
1136
- "model-00002-of-00003.safetensors: 91%|█████████ | 4.53G/4.98G [01:21<00:06, 68.4MB/s]\u001b[A\u001b[A\n",
1137
- "model-00001-of-00003.safetensors: 84%|████████▍ | 4.19G/4.98G [01:21<00:14, 54.5MB/s]\u001b[A\n",
1138
- "\n",
1139
- "model-00002-of-00003.safetensors: 91%|█████████▏| 4.55G/4.98G [01:21<00:06, 68.6MB/s]\u001b[A\u001b[A\n",
1140
- "\n",
1141
- "model-00002-of-00003.safetensors: 92%|█████████▏| 4.56G/4.98G [01:22<00:06, 69.3MB/s]\u001b[A\u001b[A\n",
1142
- "\n",
1143
- "model-00002-of-00003.safetensors: 92%|█████████▏| 4.57G/4.98G [01:22<00:05, 72.9MB/s]\u001b[A\u001b[A\n",
1144
- "model-00001-of-00003.safetensors: 85%|████████▍ | 4.22G/4.98G [01:22<00:16, 46.3MB/s]\u001b[A\n",
1145
- "\n",
1146
- "model-00002-of-00003.safetensors: 92%|█████████▏| 4.58G/4.98G [01:22<00:06, 66.7MB/s]\u001b[A\u001b[A\n",
1147
- "\n",
1148
- "model-00002-of-00003.safetensors: 92%|█████████▏| 4.59G/4.98G [01:22<00:05, 69.3MB/s]\u001b[A\u001b[A\n",
1149
- "model-00001-of-00003.safetensors: 85%|████████▍ | 4.23G/4.98G [01:22<00:17, 42.2MB/s]\u001b[A\n",
1150
- "\n",
1151
- "model-00002-of-00003.safetensors: 93%|█████████▎| 4.61G/4.98G [01:22<00:05, 69.2MB/s]\u001b[A\u001b[A\n",
1152
- "model-00001-of-00003.safetensors: 85%|████████▌ | 4.25G/4.98G [01:22<00:14, 51.6MB/s]\u001b[A\n",
1153
- "\n",
1154
- "model-00002-of-00003.safetensors: 93%|█████████▎| 4.62G/4.98G [01:22<00:05, 67.6MB/s]\u001b[A\u001b[A\n",
1155
- "model-00001-of-00003.safetensors: 85%|████████▌ | 4.26G/4.98G [01:23<00:14, 50.4MB/s]\u001b[A\n",
1156
- "\n",
1157
- "model-00002-of-00003.safetensors: 93%|█████████▎| 4.65G/4.98G [01:23<00:04, 80.9MB/s]\u001b[A\u001b[A\n",
1158
- "model-00001-of-00003.safetensors: 86%|████████▌ | 4.28G/4.98G [01:23<00:11, 63.1MB/s]\u001b[A\n",
1159
- "\n",
1160
- "model-00002-of-00003.safetensors: 94%|█████████▎| 4.67G/4.98G [01:23<00:03, 86.5MB/s]\u001b[A\u001b[A\n",
1161
- "model-00001-of-00003.safetensors: 86%|████████▌ | 4.29G/4.98G [01:23<00:12, 55.3MB/s]\u001b[A\n",
1162
- "\n",
1163
- "model-00002-of-00003.safetensors: 94%|█████████▍| 4.68G/4.98G [01:23<00:04, 61.9MB/s]\u001b[A\u001b[A\n",
1164
- "model-00001-of-00003.safetensors: 86%|████████▋ | 4.31G/4.98G [01:23<00:10, 65.8MB/s]\u001b[A\n",
1165
- "\n",
1166
- "model-00002-of-00003.safetensors: 94%|█████████▍| 4.69G/4.98G [01:23<00:04, 61.9MB/s]\u001b[A\u001b[A\n",
1167
- "\n",
1168
- "model-00002-of-00003.safetensors: 94%|█████████▍| 4.70G/4.98G [01:24<00:04, 62.7MB/s]\u001b[A\u001b[A\n",
1169
- "model-00001-of-00003.safetensors: 87%|████████▋ | 4.32G/4.98G [01:24<00:12, 54.2MB/s]\u001b[A\n",
1170
- "model-00001-of-00003.safetensors: 87%|████████▋ | 4.34G/4.98G [01:24<00:10, 61.2MB/s]\u001b[A\n",
1171
- "\n",
1172
- "model-00002-of-00003.safetensors: 94%|█████████▍| 4.71G/4.98G [01:24<00:06, 43.7MB/s]\u001b[A\u001b[A\n",
1173
- "model-00001-of-00003.safetensors: 87%|████████▋ | 4.35G/4.98G [01:24<00:10, 57.4MB/s]\u001b[A\n",
1174
- "model-00001-of-00003.safetensors: 88%|████████▊ | 4.36G/4.98G [01:24<00:10, 61.0MB/s]\u001b[A\n",
1175
- "\n",
1176
- "model-00002-of-00003.safetensors: 95%|█████████▍| 4.73G/4.98G [01:24<00:05, 47.1MB/s]\u001b[A\u001b[A\n",
1177
- "model-00001-of-00003.safetensors: 88%|████████▊ | 4.37G/4.98G [01:25<00:10, 56.1MB/s]\u001b[A\n",
1178
- "\n",
1179
- "model-00002-of-00003.safetensors: 95%|█████████▌| 4.74G/4.98G [01:25<00:05, 42.0MB/s]\u001b[A\u001b[A\n",
1180
- "model-00001-of-00003.safetensors: 88%|████████▊ | 4.38G/4.98G [01:25<00:13, 44.1MB/s]\u001b[A\n",
1181
- "\n",
1182
- "model-00002-of-00003.safetensors: 95%|█████████▌| 4.75G/4.98G [01:25<00:05, 44.7MB/s]\u001b[A\u001b[A\n",
1183
- "model-00001-of-00003.safetensors: 88%|████████▊ | 4.39G/4.98G [01:25<00:12, 47.3MB/s]\u001b[A\n",
1184
- "\n",
1185
- "model-00002-of-00003.safetensors: 96%|█████████▌| 4.76G/4.98G [01:25<00:04, 44.8MB/s]\u001b[A\u001b[A\n",
1186
- "model-00001-of-00003.safetensors: 88%|████████▊ | 4.40G/4.98G [01:25<00:12, 45.0MB/s]\u001b[A\n",
1187
- "\n",
1188
- "model-00002-of-00003.safetensors: 96%|█████████▌| 4.77G/4.98G [01:25<00:04, 45.1MB/s]\u001b[A\u001b[A\n",
1189
- "\n",
1190
- "model-00002-of-00003.safetensors: 96%|█████████▌| 4.79G/4.98G [01:26<00:03, 58.4MB/s]\u001b[A\u001b[A\n",
1191
- "model-00001-of-00003.safetensors: 89%|████████▉ | 4.42G/4.98G [01:26<00:12, 44.8MB/s]\u001b[A\n",
1192
- "\n",
1193
- "model-00002-of-00003.safetensors: 96%|█████████▋| 4.80G/4.98G [01:26<00:03, 50.2MB/s]\u001b[A\u001b[A\n",
1194
- "model-00001-of-00003.safetensors: 89%|████████▉ | 4.44G/4.98G [01:26<00:11, 48.7MB/s]\u001b[A\n",
1195
- "\n",
1196
- "model-00002-of-00003.safetensors: 97%|█████████▋| 4.81G/4.98G [01:26<00:03, 55.1MB/s]\u001b[A\u001b[A\n",
1197
- "\n",
1198
- "model-00002-of-00003.safetensors: 97%|█████████▋| 4.82G/4.98G [01:26<00:02, 60.6MB/s]\u001b[A\u001b[A\n",
1199
- "model-00001-of-00003.safetensors: 89%|████████▉ | 4.46G/4.98G [01:26<00:10, 50.0MB/s]\u001b[A\n",
1200
- "\n",
1201
- "model-00002-of-00003.safetensors: 97%|█████████▋| 4.83G/4.98G [01:26<00:02, 50.3MB/s]\u001b[A\u001b[A\n",
1202
- "model-00001-of-00003.safetensors: 90%|████████▉ | 4.47G/4.98G [01:27<00:11, 45.4MB/s]\u001b[A\n",
1203
- "\n",
1204
- "model-00002-of-00003.safetensors: 97%|█████████▋| 4.85G/4.98G [01:27<00:02, 61.7MB/s]\u001b[A\u001b[A\n",
1205
- "\n",
1206
- "model-00002-of-00003.safetensors: 98%|█████████▊| 4.87G/4.98G [01:27<00:01, 64.6MB/s]\u001b[A\u001b[A\n",
1207
- "model-00001-of-00003.safetensors: 90%|█████████ | 4.49G/4.98G [01:27<00:08, 56.3MB/s]\u001b[A\n",
1208
- "\n",
1209
- "model-00002-of-00003.safetensors: 98%|█████████▊| 4.89G/4.98G [01:27<00:01, 75.8MB/s]\u001b[A\u001b[A\n",
1210
- "\n",
1211
- "model-00002-of-00003.safetensors: 98%|█████████▊| 4.90G/4.98G [01:27<00:01, 65.1MB/s]\u001b[A\u001b[A\n",
1212
- "model-00001-of-00003.safetensors: 90%|█████████ | 4.50G/4.98G [01:27<00:11, 41.5MB/s]\u001b[A\n",
1213
- "model-00001-of-00003.safetensors: 91%|█████████ | 4.52G/4.98G [01:28<00:08, 56.4MB/s]\u001b[A\n",
1214
- "\n",
1215
- "model-00002-of-00003.safetensors: 99%|█████████▊| 4.92G/4.98G [01:28<00:00, 67.9MB/s]\u001b[A\u001b[A\n",
1216
- "model-00001-of-00003.safetensors: 91%|█████████ | 4.53G/4.98G [01:28<00:07, 57.4MB/s]\u001b[A\n",
1217
- "model-00001-of-00003.safetensors: 91%|█████████▏| 4.55G/4.98G [01:28<00:05, 72.4MB/s]\u001b[A\n",
1218
- "\n",
1219
- "model-00002-of-00003.safetensors: 99%|█████████▉| 4.93G/4.98G [01:28<00:00, 54.6MB/s]\u001b[A\u001b[A\n",
1220
- "model-00001-of-00003.safetensors: 92%|█████████▏| 4.56G/4.98G [01:28<00:05, 73.0MB/s]\u001b[A\n",
1221
- "\n",
1222
- "model-00002-of-00003.safetensors: 99%|█████████▉| 4.95G/4.98G [01:28<00:00, 63.3MB/s]\u001b[A\u001b[A\n",
1223
- "model-00001-of-00003.safetensors: 92%|█████████▏| 4.58G/4.98G [01:28<00:04, 80.1MB/s]\u001b[A\n",
1224
- "\n",
1225
- "model-00002-of-00003.safetensors: 100%|█████████▉| 4.96G/4.98G [01:28<00:00, 63.9MB/s]\u001b[A\u001b[A\n",
1226
- "\n",
1227
- "model-00002-of-00003.safetensors: 100%|█████████▉| 4.97G/4.98G [01:29<00:00, 59.7MB/s]\u001b[A\u001b[A\n",
1228
- "model-00001-of-00003.safetensors: 92%|█████████▏| 4.59G/4.98G [01:29<00:06, 59.6MB/s]\u001b[A\n",
1229
- "\n",
1230
- "model-00002-of-00003.safetensors: 100%|██████████| 4.98G/4.98G [01:29<00:00, 55.9MB/s]\u001b[A\u001b[A\n",
1231
- "\n",
1232
- "model-00001-of-00003.safetensors: 93%|█████████▎| 4.61G/4.98G [01:29<00:05, 62.2MB/s]\u001b[A\n",
1233
- "model-00001-of-00003.safetensors: 93%|█████████▎| 4.62G/4.98G [01:29<00:06, 57.7MB/s]\u001b[A\n",
1234
- "model-00001-of-00003.safetensors: 93%|█████████▎| 4.65G/4.98G [01:29<00:05, 65.2MB/s]\u001b[A\n",
1235
- "model-00001-of-00003.safetensors: 93%|█████████▎| 4.66G/4.98G [01:30<00:05, 64.6MB/s]\u001b[A\n",
1236
- "model-00001-of-00003.safetensors: 94%|█████████▎| 4.67G/4.98G [01:30<00:04, 65.1MB/s]\u001b[A\n",
1237
- "model-00001-of-00003.safetensors: 94%|█████████▍| 4.68G/4.98G [01:30<00:05, 60.3MB/s]\u001b[A\n",
1238
- "model-00001-of-00003.safetensors: 94%|█████████▍| 4.70G/4.98G [01:30<00:04, 60.8MB/s]\u001b[A\n",
1239
- "model-00001-of-00003.safetensors: 94%|█████████▍| 4.71G/4.98G [01:30<00:04, 62.1MB/s]\u001b[A\n",
1240
- "model-00001-of-00003.safetensors: 95%|█████████▍| 4.73G/4.98G [01:31<00:03, 73.0MB/s]\u001b[A\n",
1241
- "model-00001-of-00003.safetensors: 95%|█████████▌| 4.74G/4.98G [01:31<00:03, 75.3MB/s]\u001b[A\n",
1242
- "model-00001-of-00003.safetensors: 96%|█████████▌| 4.76G/4.98G [01:31<00:02, 85.7MB/s]\u001b[A\n",
1243
- "model-00001-of-00003.safetensors: 96%|█████████▌| 4.77G/4.98G [01:31<00:03, 60.2MB/s]\u001b[A\n",
1244
- "model-00001-of-00003.safetensors: 96%|█████████▌| 4.78G/4.98G [01:32<00:03, 52.4MB/s]\u001b[A\n",
1245
- "model-00001-of-00003.safetensors: 96%|█████████▌| 4.79G/4.98G [01:32<00:03, 56.1MB/s]\u001b[A\n",
1246
- "model-00001-of-00003.safetensors: 96%|█████████▋| 4.80G/4.98G [01:32<00:04, 44.7MB/s]\u001b[A\n",
1247
- "model-00001-of-00003.safetensors: 97%|█████████▋| 4.82G/4.98G [01:32<00:02, 58.1MB/s]\u001b[A\n",
1248
- "model-00001-of-00003.safetensors: 97%|█████████▋| 4.83G/4.98G [01:33<00:02, 54.4MB/s]\u001b[A\n",
1249
- "model-00001-of-00003.safetensors: 97%|█████████▋| 4.85G/4.98G [01:33<00:02, 51.5MB/s]\u001b[A\n",
1250
- "model-00001-of-00003.safetensors: 98%|█████████▊| 4.87G/4.98G [01:33<00:02, 44.7MB/s]\u001b[A\n",
1251
- "model-00001-of-00003.safetensors: 98%|█████████▊| 4.88G/4.98G [01:34<00:02, 45.1MB/s]\u001b[A\n",
1252
- "model-00001-of-00003.safetensors: 98%|█████████▊| 4.89G/4.98G [01:34<00:01, 52.4MB/s]\u001b[A\n",
1253
- "model-00001-of-00003.safetensors: 98%|█████████▊| 4.90G/4.98G [01:34<00:01, 55.3MB/s]\u001b[A\n",
1254
- "model-00001-of-00003.safetensors: 98%|█████████▊| 4.91G/4.98G [01:34<00:01, 57.0MB/s]\u001b[A\n",
1255
- "model-00001-of-00003.safetensors: 99%|█████████▊| 4.92G/4.98G [01:34<00:01, 57.2MB/s]\u001b[A\n",
1256
- "model-00001-of-00003.safetensors: 99%|█████████▉| 4.93G/4.98G [01:34<00:00, 57.8MB/s]\u001b[A\n",
1257
- "model-00001-of-00003.safetensors: 99%|█████████▉| 4.95G/4.98G [01:35<00:00, 67.6MB/s]\u001b[A\n",
1258
- "model-00001-of-00003.safetensors: 100%|█████████▉| 4.96G/4.98G [01:35<00:00, 69.8MB/s]\u001b[A\n",
1259
- "model-00001-of-00003.safetensors: 100%|█████████▉| 4.97G/4.98G [01:35<00:00, 64.0MB/s]\u001b[A\n",
1260
- "model-00001-of-00003.safetensors: 100%|██████████| 4.98G/4.98G [01:35<00:00, 52.0MB/s]\u001b[A\n"
1261
  ]
1262
  },
1263
  {
1264
  "ename": "KeyError",
1265
- "evalue": "'base_model.model.base_model.model.model.layers.0.self_attn.qkv_proj.lora_A.weight'",
1266
  "output_type": "error",
1267
  "traceback": [
1268
  "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
1269
  "\u001b[0;31mKeyError\u001b[0m Traceback (most recent call last)",
1270
- "Cell \u001b[0;32mIn[4], line 4\u001b[0m\n\u001b[1;32m 2\u001b[0m base_model_name\u001b[38;5;241m=\u001b[39m\u001b[38;5;124m'\u001b[39m\u001b[38;5;124mmicrosoft/phi-2\u001b[39m\u001b[38;5;124m'\u001b[39m\n\u001b[1;32m 3\u001b[0m merged_peft_model_name\u001b[38;5;241m=\u001b[39m\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124maissatoubalde/lab\u001b[39m\u001b[38;5;124m\"\u001b[39m\n\u001b[0;32m----> 4\u001b[0m llm \u001b[38;5;241m=\u001b[39m \u001b[43mLLM\u001b[49m\u001b[43m(\u001b[49m\u001b[43mmodel\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mmerged_peft_model_name\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mtokenizer\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mbase_model_name\u001b[49m\u001b[43m)\u001b[49m\n",
1271
  "File \u001b[0;32m/usr/local/lib/python3.11/site-packages/vllm/entrypoints/llm.py:109\u001b[0m, in \u001b[0;36mLLM.__init__\u001b[0;34m(self, model, tokenizer, tokenizer_mode, trust_remote_code, tensor_parallel_size, dtype, quantization, revision, tokenizer_revision, seed, gpu_memory_utilization, swap_space, enforce_eager, max_context_len_to_capture, disable_custom_all_reduce, **kwargs)\u001b[0m\n\u001b[1;32m 90\u001b[0m kwargs[\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mdisable_log_stats\u001b[39m\u001b[38;5;124m\"\u001b[39m] \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;01mTrue\u001b[39;00m\n\u001b[1;32m 91\u001b[0m engine_args \u001b[38;5;241m=\u001b[39m EngineArgs(\n\u001b[1;32m 92\u001b[0m model\u001b[38;5;241m=\u001b[39mmodel,\n\u001b[1;32m 93\u001b[0m tokenizer\u001b[38;5;241m=\u001b[39mtokenizer,\n\u001b[0;32m (...)\u001b[0m\n\u001b[1;32m 107\u001b[0m \u001b[38;5;241m*\u001b[39m\u001b[38;5;241m*\u001b[39mkwargs,\n\u001b[1;32m 108\u001b[0m )\n\u001b[0;32m--> 109\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mllm_engine \u001b[38;5;241m=\u001b[39m \u001b[43mLLMEngine\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mfrom_engine_args\u001b[49m\u001b[43m(\u001b[49m\u001b[43mengine_args\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 110\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mrequest_counter \u001b[38;5;241m=\u001b[39m Counter()\n",
1272
  "File \u001b[0;32m/usr/local/lib/python3.11/site-packages/vllm/engine/llm_engine.py:356\u001b[0m, in \u001b[0;36mLLMEngine.from_engine_args\u001b[0;34m(cls, engine_args)\u001b[0m\n\u001b[1;32m 354\u001b[0m placement_group \u001b[38;5;241m=\u001b[39m initialize_cluster(parallel_config)\n\u001b[1;32m 355\u001b[0m \u001b[38;5;66;03m# Create the LLM engine.\u001b[39;00m\n\u001b[0;32m--> 356\u001b[0m engine \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;43mcls\u001b[39;49m\u001b[43m(\u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43mengine_configs\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 357\u001b[0m \u001b[43m \u001b[49m\u001b[43mplacement_group\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 358\u001b[0m \u001b[43m \u001b[49m\u001b[43mlog_stats\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[38;5;129;43;01mnot\u001b[39;49;00m\u001b[43m \u001b[49m\u001b[43mengine_args\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mdisable_log_stats\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 359\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m engine\n",
1273
  "File \u001b[0;32m/usr/local/lib/python3.11/site-packages/vllm/engine/llm_engine.py:111\u001b[0m, in \u001b[0;36mLLMEngine.__init__\u001b[0;34m(self, model_config, cache_config, parallel_config, scheduler_config, lora_config, placement_group, log_stats)\u001b[0m\n\u001b[1;32m 109\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_init_workers_ray(placement_group)\n\u001b[1;32m 110\u001b[0m \u001b[38;5;28;01melse\u001b[39;00m:\n\u001b[0;32m--> 111\u001b[0m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43m_init_workers\u001b[49m\u001b[43m(\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 113\u001b[0m \u001b[38;5;66;03m# Profile the memory usage and initialize the cache.\u001b[39;00m\n\u001b[1;32m 114\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_init_cache()\n",
@@ -1276,8 +283,8 @@
1276
  "File \u001b[0;32m/usr/local/lib/python3.11/site-packages/vllm/worker/worker.py:92\u001b[0m, in \u001b[0;36mWorker.load_model\u001b[0;34m(self)\u001b[0m\n\u001b[1;32m 91\u001b[0m \u001b[38;5;28;01mdef\u001b[39;00m \u001b[38;5;21mload_model\u001b[39m(\u001b[38;5;28mself\u001b[39m):\n\u001b[0;32m---> 92\u001b[0m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mmodel_runner\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mload_model\u001b[49m\u001b[43m(\u001b[49m\u001b[43m)\u001b[49m\n",
1277
  "File \u001b[0;32m/usr/local/lib/python3.11/site-packages/vllm/worker/model_runner.py:75\u001b[0m, in \u001b[0;36mModelRunner.load_model\u001b[0;34m(self)\u001b[0m\n\u001b[1;32m 74\u001b[0m \u001b[38;5;28;01mdef\u001b[39;00m \u001b[38;5;21mload_model\u001b[39m(\u001b[38;5;28mself\u001b[39m) \u001b[38;5;241m-\u001b[39m\u001b[38;5;241m>\u001b[39m \u001b[38;5;28;01mNone\u001b[39;00m:\n\u001b[0;32m---> 75\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mmodel \u001b[38;5;241m=\u001b[39m \u001b[43mget_model\u001b[49m\u001b[43m(\u001b[49m\u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mmodel_config\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mlora_config\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 77\u001b[0m vocab_size \u001b[38;5;241m=\u001b[39m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mmodel\u001b[38;5;241m.\u001b[39mconfig\u001b[38;5;241m.\u001b[39mvocab_size\n\u001b[1;32m 79\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mlora_config:\n",
1278
  "File \u001b[0;32m/usr/local/lib/python3.11/site-packages/vllm/model_executor/model_loader.py:88\u001b[0m, in \u001b[0;36mget_model\u001b[0;34m(model_config, lora_config)\u001b[0m\n\u001b[1;32m 85\u001b[0m initialize_dummy_weights(model)\n\u001b[1;32m 86\u001b[0m \u001b[38;5;28;01melse\u001b[39;00m:\n\u001b[1;32m 87\u001b[0m \u001b[38;5;66;03m# Load the weights from the cached or downloaded files.\u001b[39;00m\n\u001b[0;32m---> 88\u001b[0m \u001b[43mmodel\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mload_weights\u001b[49m\u001b[43m(\u001b[49m\u001b[43mmodel_config\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mmodel\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mmodel_config\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mdownload_dir\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 89\u001b[0m \u001b[43m \u001b[49m\u001b[43mmodel_config\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mload_format\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mmodel_config\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mrevision\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 90\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m model\u001b[38;5;241m.\u001b[39meval()\n",
1279
- "File \u001b[0;32m/usr/local/lib/python3.11/site-packages/vllm/model_executor/models/phi.py:292\u001b[0m, in \u001b[0;36mPhiForCausalLM.load_weights\u001b[0;34m(self, model_name_or_path, cache_dir, load_format, revision)\u001b[0m\n\u001b[1;32m 290\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m name\u001b[38;5;241m.\u001b[39mendswith(\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124m.bias\u001b[39m\u001b[38;5;124m\"\u001b[39m) \u001b[38;5;129;01mand\u001b[39;00m name \u001b[38;5;129;01mnot\u001b[39;00m \u001b[38;5;129;01min\u001b[39;00m params_dict:\n\u001b[1;32m 291\u001b[0m \u001b[38;5;28;01mcontinue\u001b[39;00m\n\u001b[0;32m--> 292\u001b[0m param \u001b[38;5;241m=\u001b[39m \u001b[43mparams_dict\u001b[49m\u001b[43m[\u001b[49m\u001b[43mname\u001b[49m\u001b[43m]\u001b[49m\n\u001b[1;32m 293\u001b[0m weight_loader \u001b[38;5;241m=\u001b[39m param\u001b[38;5;241m.\u001b[39mweight_loader\n\u001b[1;32m 294\u001b[0m weight_loader(param, loaded_weight, shard_id)\n",
1280
- "\u001b[0;31mKeyError\u001b[0m: 'base_model.model.base_model.model.model.layers.0.self_attn.qkv_proj.lora_A.weight'"
1281
  ]
1282
  }
1283
  ],
 
225
  },
226
  {
227
  "cell_type": "code",
228
+ "execution_count": 5,
229
  "id": "75a61ec8-e440-42b0-8b4d-e3cb05841b71",
230
  "metadata": {},
231
+ "outputs": [],
 
 
 
 
 
 
 
 
 
 
232
  "source": [
233
  "import torch\n",
234
  "import numpy as np\n",
 
240
  },
241
  {
242
  "cell_type": "code",
243
+ "execution_count": 7,
244
  "id": "7d29ba48-d4b0-4f24-8f88-560d9bed100c",
245
  "metadata": {
246
  "scrolled": true
247
  },
248
  "outputs": [
 
 
 
 
 
 
 
249
  {
250
  "name": "stdout",
251
  "output_type": "stream",
252
  "text": [
253
+ "INFO 02-15 18:03:33 llm_engine.py:72] Initializing an LLM engine with config: model='aissatoubalde/lab', tokenizer='microsoft/phi-2', tokenizer_mode=auto, revision=None, tokenizer_revision=None, trust_remote_code=False, dtype=torch.float16, max_seq_len=2048, download_dir=None, load_format=auto, tensor_parallel_size=1, disable_custom_all_reduce=False, quantization=None, enforce_eager=False, kv_cache_dtype=auto, seed=0)\n"
254
  ]
255
  },
256
  {
257
  "name": "stderr",
258
  "output_type": "stream",
259
  "text": [
 
260
  "Special tokens have been added in the vocabulary, make sure the associated word embeddings are fine-tuned or trained.\n"
261
  ]
262
  },
 
264
  "name": "stdout",
265
  "output_type": "stream",
266
  "text": [
267
+ "INFO 02-15 18:03:33 weight_utils.py:164] Using model weights format ['*.safetensors']\n"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
268
  ]
269
  },
270
  {
271
  "ename": "KeyError",
272
+ "evalue": "'base_model.model.model.layers.0.mlp.fc1.lora_A.weight'",
273
  "output_type": "error",
274
  "traceback": [
275
  "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
276
  "\u001b[0;31mKeyError\u001b[0m Traceback (most recent call last)",
277
+ "Cell \u001b[0;32mIn[7], line 4\u001b[0m\n\u001b[1;32m 2\u001b[0m base_model_name\u001b[38;5;241m=\u001b[39m\u001b[38;5;124m'\u001b[39m\u001b[38;5;124mmicrosoft/phi-2\u001b[39m\u001b[38;5;124m'\u001b[39m\n\u001b[1;32m 3\u001b[0m merged_peft_model_name\u001b[38;5;241m=\u001b[39m\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124maissatoubalde/lab\u001b[39m\u001b[38;5;124m\"\u001b[39m\n\u001b[0;32m----> 4\u001b[0m llm \u001b[38;5;241m=\u001b[39m \u001b[43mLLM\u001b[49m\u001b[43m(\u001b[49m\u001b[43mmodel\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mmerged_peft_model_name\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mtokenizer\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mbase_model_name\u001b[49m\u001b[43m)\u001b[49m\n",
278
  "File \u001b[0;32m/usr/local/lib/python3.11/site-packages/vllm/entrypoints/llm.py:109\u001b[0m, in \u001b[0;36mLLM.__init__\u001b[0;34m(self, model, tokenizer, tokenizer_mode, trust_remote_code, tensor_parallel_size, dtype, quantization, revision, tokenizer_revision, seed, gpu_memory_utilization, swap_space, enforce_eager, max_context_len_to_capture, disable_custom_all_reduce, **kwargs)\u001b[0m\n\u001b[1;32m 90\u001b[0m kwargs[\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mdisable_log_stats\u001b[39m\u001b[38;5;124m\"\u001b[39m] \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;01mTrue\u001b[39;00m\n\u001b[1;32m 91\u001b[0m engine_args \u001b[38;5;241m=\u001b[39m EngineArgs(\n\u001b[1;32m 92\u001b[0m model\u001b[38;5;241m=\u001b[39mmodel,\n\u001b[1;32m 93\u001b[0m tokenizer\u001b[38;5;241m=\u001b[39mtokenizer,\n\u001b[0;32m (...)\u001b[0m\n\u001b[1;32m 107\u001b[0m \u001b[38;5;241m*\u001b[39m\u001b[38;5;241m*\u001b[39mkwargs,\n\u001b[1;32m 108\u001b[0m )\n\u001b[0;32m--> 109\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mllm_engine \u001b[38;5;241m=\u001b[39m \u001b[43mLLMEngine\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mfrom_engine_args\u001b[49m\u001b[43m(\u001b[49m\u001b[43mengine_args\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 110\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mrequest_counter \u001b[38;5;241m=\u001b[39m Counter()\n",
279
  "File \u001b[0;32m/usr/local/lib/python3.11/site-packages/vllm/engine/llm_engine.py:356\u001b[0m, in \u001b[0;36mLLMEngine.from_engine_args\u001b[0;34m(cls, engine_args)\u001b[0m\n\u001b[1;32m 354\u001b[0m placement_group \u001b[38;5;241m=\u001b[39m initialize_cluster(parallel_config)\n\u001b[1;32m 355\u001b[0m \u001b[38;5;66;03m# Create the LLM engine.\u001b[39;00m\n\u001b[0;32m--> 356\u001b[0m engine \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;43mcls\u001b[39;49m\u001b[43m(\u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43mengine_configs\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 357\u001b[0m \u001b[43m \u001b[49m\u001b[43mplacement_group\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 358\u001b[0m \u001b[43m \u001b[49m\u001b[43mlog_stats\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[38;5;129;43;01mnot\u001b[39;49;00m\u001b[43m \u001b[49m\u001b[43mengine_args\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mdisable_log_stats\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 359\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m engine\n",
280
  "File \u001b[0;32m/usr/local/lib/python3.11/site-packages/vllm/engine/llm_engine.py:111\u001b[0m, in \u001b[0;36mLLMEngine.__init__\u001b[0;34m(self, model_config, cache_config, parallel_config, scheduler_config, lora_config, placement_group, log_stats)\u001b[0m\n\u001b[1;32m 109\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_init_workers_ray(placement_group)\n\u001b[1;32m 110\u001b[0m \u001b[38;5;28;01melse\u001b[39;00m:\n\u001b[0;32m--> 111\u001b[0m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43m_init_workers\u001b[49m\u001b[43m(\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 113\u001b[0m \u001b[38;5;66;03m# Profile the memory usage and initialize the cache.\u001b[39;00m\n\u001b[1;32m 114\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_init_cache()\n",
 
283
  "File \u001b[0;32m/usr/local/lib/python3.11/site-packages/vllm/worker/worker.py:92\u001b[0m, in \u001b[0;36mWorker.load_model\u001b[0;34m(self)\u001b[0m\n\u001b[1;32m 91\u001b[0m \u001b[38;5;28;01mdef\u001b[39;00m \u001b[38;5;21mload_model\u001b[39m(\u001b[38;5;28mself\u001b[39m):\n\u001b[0;32m---> 92\u001b[0m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mmodel_runner\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mload_model\u001b[49m\u001b[43m(\u001b[49m\u001b[43m)\u001b[49m\n",
284
  "File \u001b[0;32m/usr/local/lib/python3.11/site-packages/vllm/worker/model_runner.py:75\u001b[0m, in \u001b[0;36mModelRunner.load_model\u001b[0;34m(self)\u001b[0m\n\u001b[1;32m 74\u001b[0m \u001b[38;5;28;01mdef\u001b[39;00m \u001b[38;5;21mload_model\u001b[39m(\u001b[38;5;28mself\u001b[39m) \u001b[38;5;241m-\u001b[39m\u001b[38;5;241m>\u001b[39m \u001b[38;5;28;01mNone\u001b[39;00m:\n\u001b[0;32m---> 75\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mmodel \u001b[38;5;241m=\u001b[39m \u001b[43mget_model\u001b[49m\u001b[43m(\u001b[49m\u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mmodel_config\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mlora_config\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 77\u001b[0m vocab_size \u001b[38;5;241m=\u001b[39m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mmodel\u001b[38;5;241m.\u001b[39mconfig\u001b[38;5;241m.\u001b[39mvocab_size\n\u001b[1;32m 79\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mlora_config:\n",
285
  "File \u001b[0;32m/usr/local/lib/python3.11/site-packages/vllm/model_executor/model_loader.py:88\u001b[0m, in \u001b[0;36mget_model\u001b[0;34m(model_config, lora_config)\u001b[0m\n\u001b[1;32m 85\u001b[0m initialize_dummy_weights(model)\n\u001b[1;32m 86\u001b[0m \u001b[38;5;28;01melse\u001b[39;00m:\n\u001b[1;32m 87\u001b[0m \u001b[38;5;66;03m# Load the weights from the cached or downloaded files.\u001b[39;00m\n\u001b[0;32m---> 88\u001b[0m \u001b[43mmodel\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mload_weights\u001b[49m\u001b[43m(\u001b[49m\u001b[43mmodel_config\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mmodel\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mmodel_config\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mdownload_dir\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 89\u001b[0m \u001b[43m \u001b[49m\u001b[43mmodel_config\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mload_format\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mmodel_config\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mrevision\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 90\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m model\u001b[38;5;241m.\u001b[39meval()\n",
286
+ "File \u001b[0;32m/usr/local/lib/python3.11/site-packages/vllm/model_executor/models/phi.py:302\u001b[0m, in \u001b[0;36mPhiForCausalLM.load_weights\u001b[0;34m(self, model_name_or_path, cache_dir, load_format, revision)\u001b[0m\n\u001b[1;32m 299\u001b[0m \u001b[38;5;28;01mcontinue\u001b[39;00m\n\u001b[1;32m 300\u001b[0m \u001b[38;5;66;03m# pylint: disable=E1136\u001b[39;00m\n\u001b[0;32m--> 302\u001b[0m param \u001b[38;5;241m=\u001b[39m \u001b[43mparams_dict\u001b[49m\u001b[43m[\u001b[49m\u001b[43mname\u001b[49m\u001b[43m]\u001b[49m\n\u001b[1;32m 303\u001b[0m weight_loader \u001b[38;5;241m=\u001b[39m \u001b[38;5;28mgetattr\u001b[39m(param, \u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mweight_loader\u001b[39m\u001b[38;5;124m\"\u001b[39m,\n\u001b[1;32m 304\u001b[0m default_weight_loader)\n\u001b[1;32m 305\u001b[0m weight_loader(param, loaded_weight)\n",
287
+ "\u001b[0;31mKeyError\u001b[0m: 'base_model.model.model.layers.0.mlp.fc1.lora_A.weight'"
288
  ]
289
  }
290
  ],
phi-2-custom.ipynb CHANGED
The diff for this file is too large to render. See raw diff
 
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b97f3e3a61f154dd18e7d0d40e91564daa7cfb393ad45e0eb1adf8bad6659cc5
3
  size 4664
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b6c071b2811955d6107874169c939219fa3eadea899cc5d22b1dfc67183f694
3
  size 4664