karamjotsingh commited on
Commit
228155d
·
verified ·
1 Parent(s): bc40b5b

Upload position_ids_debug.ipynb with huggingface_hub

Browse files
Files changed (1) hide show
  1. position_ids_debug.ipynb +763 -675
position_ids_debug.ipynb CHANGED
@@ -293,15 +293,15 @@
293
  },
294
  {
295
  "cell_type": "code",
296
- "execution_count": 6,
297
  "id": "039f1456-ffa4-40b2-8ba1-a0cd5f74733e",
298
  "metadata": {
299
  "execution": {
300
- "iopub.execute_input": "2026-03-25T08:45:08.296250Z",
301
- "iopub.status.busy": "2026-03-25T08:45:08.296111Z",
302
- "iopub.status.idle": "2026-03-25T08:45:08.348040Z",
303
- "shell.execute_reply": "2026-03-25T08:45:08.347477Z",
304
- "shell.execute_reply.started": "2026-03-25T08:45:08.296237Z"
305
  },
306
  "scrolled": true
307
  },
@@ -310,682 +310,770 @@
310
  "name": "stdout",
311
  "output_type": "stream",
312
  "text": [
313
- "0 torch.Size([128])\n",
314
- " [0:16] 1.0 1.0\n",
315
- " [16:40] 1.0 1.0\n",
316
- " [40:64] 1.0 1.0\n",
317
- " [64:80] 1.0 1.0\n",
318
- " [80:104] 1.0 1.0\n",
319
- " [104:128] 1.0 1.0\n",
320
- "1 torch.Size([128])\n",
321
- " [0:16] 0.54052734375 0.9990234375\n",
322
- " [16:40] 0.99951171875 1.0\n",
323
- " [40:64] 1.0 1.0\n",
324
- " [64:80] 0.54052734375 0.9990234375\n",
325
- " [80:104] 0.99951171875 1.0\n",
326
- " [104:128] 1.0 1.0\n",
327
- "2 torch.Size([128])\n",
328
- " [0:16] -0.416259765625 0.9970703125\n",
329
- " [16:40] 0.998046875 1.0\n",
330
- " [40:64] 1.0 1.0\n",
331
- " [64:80] -0.416259765625 0.9970703125\n",
332
- " [80:104] 0.998046875 1.0\n",
333
- " [104:128] 1.0 1.0\n",
334
- "3 torch.Size([128])\n",
335
- " [0:16] -0.990234375 0.9931640625\n",
336
- " [16:40] 0.99560546875 1.0\n",
337
- " [40:64] 1.0 1.0\n",
338
- " [64:80] -0.990234375 0.9931640625\n",
339
- " [80:104] 0.99560546875 1.0\n",
340
- " [104:128] 1.0 1.0\n",
341
- "4 torch.Size([128])\n",
342
- " [0:16] -0.97314453125 0.98681640625\n",
343
- " [16:40] 0.9921875 1.0\n",
344
- " [40:64] 1.0 1.0\n",
345
- " [64:80] -0.97314453125 0.98681640625\n",
346
- " [80:104] 0.9921875 1.0\n",
347
- " [104:128] 1.0 1.0\n",
348
- "5 torch.Size([128])\n",
349
- " [0:16] -0.97314453125 0.98681640625\n",
350
- " [16:40] 0.9921875 1.0\n",
351
- " [40:64] 1.0 1.0\n",
352
- " [64:80] -0.97314453125 0.98681640625\n",
353
- " [80:104] 0.9921875 1.0\n",
354
- " [104:128] 1.0 1.0\n",
355
- "6 torch.Size([128])\n",
356
- " [0:16] -0.97314453125 0.98681640625\n",
357
- " [16:40] 0.9921875 1.0\n",
358
- " [40:64] 1.0 1.0\n",
359
- " [64:80] -0.97314453125 0.98681640625\n",
360
- " [80:104] 0.9921875 1.0\n",
361
- " [104:128] 1.0 1.0\n",
362
- "7 torch.Size([128])\n",
363
- " [0:16] -0.97314453125 0.98681640625\n",
364
- " [16:40] 0.9921875 1.0\n",
365
- " [40:64] 1.0 1.0\n",
366
- " [64:80] -0.97314453125 0.98681640625\n",
367
- " [80:104] 0.9921875 1.0\n",
368
- " [104:128] 1.0 1.0\n",
369
- "8 torch.Size([128])\n",
370
- " [0:16] -0.97314453125 0.98681640625\n",
371
- " [16:40] 0.9921875 1.0\n",
372
- " [40:64] 1.0 1.0\n",
373
- " [64:80] -0.97314453125 0.98681640625\n",
374
- " [80:104] 0.9921875 1.0\n",
375
- " [104:128] 1.0 1.0\n",
376
- "9 torch.Size([128])\n",
377
- " [0:16] -0.97314453125 0.98681640625\n",
378
- " [16:40] 0.9921875 1.0\n",
379
- " [40:64] 1.0 1.0\n",
380
- " [64:80] -0.97314453125 0.98681640625\n",
381
- " [80:104] 0.9921875 1.0\n",
382
- " [104:128] 1.0 1.0\n",
383
- "10 torch.Size([128])\n",
384
- " [0:16] -0.97314453125 0.98681640625\n",
385
- " [16:40] 0.9921875 1.0\n",
386
- " [40:64] 1.0 1.0\n",
387
- " [64:80] -0.97314453125 0.98681640625\n",
388
- " [80:104] 0.9921875 1.0\n",
389
- " [104:128] 1.0 1.0\n",
390
- "11 torch.Size([128])\n",
391
- " [0:16] -0.97314453125 0.98681640625\n",
392
- " [16:40] 0.9921875 1.0\n",
393
- " [40:64] 1.0 1.0\n",
394
- " [64:80] -0.97314453125 0.98681640625\n",
395
- " [80:104] 0.9921875 1.0\n",
396
- " [104:128] 1.0 1.0\n",
397
- "12 torch.Size([128])\n",
398
- " [0:16] -0.97314453125 0.98681640625\n",
399
- " [16:40] 0.9921875 1.0\n",
400
- " [40:64] 1.0 1.0\n",
401
- " [64:80] -0.97314453125 0.98681640625\n",
402
- " [80:104] 0.9921875 1.0\n",
403
- " [104:128] 1.0 1.0\n",
404
- "13 torch.Size([128])\n",
405
- " [0:16] -0.97314453125 0.98681640625\n",
406
- " [16:40] 0.9873046875 1.0\n",
407
- " [40:64] 1.0 1.0\n",
408
- " [64:80] -0.97314453125 0.98681640625\n",
409
- " [80:104] 0.9873046875 1.0\n",
410
- " [104:128] 1.0 1.0\n",
411
- "14 torch.Size([128])\n",
412
- " [0:16] -0.97314453125 0.98681640625\n",
413
- " [16:40] 0.9873046875 1.0\n",
414
- " [40:64] 1.0 1.0\n",
415
- " [64:80] -0.97314453125 0.98681640625\n",
416
- " [80:104] 0.9873046875 1.0\n",
417
- " [104:128] 1.0 1.0\n",
418
- "15 torch.Size([128])\n",
419
- " [0:16] -0.97314453125 0.98681640625\n",
420
- " [16:40] 0.9873046875 1.0\n",
421
- " [40:64] 1.0 1.0\n",
422
- " [64:80] -0.97314453125 0.98681640625\n",
423
- " [80:104] 0.9873046875 1.0\n",
424
- " [104:128] 1.0 1.0\n",
425
- "16 torch.Size([128])\n",
426
- " [0:16] -0.97314453125 0.98681640625\n",
427
- " [16:40] 0.9873046875 1.0\n",
428
- " [40:64] 1.0 1.0\n",
429
- " [64:80] -0.97314453125 0.98681640625\n",
430
- " [80:104] 0.9873046875 1.0\n",
431
- " [104:128] 1.0 1.0\n",
432
- "17 torch.Size([128])\n",
433
- " [0:16] -0.97314453125 0.98681640625\n",
434
- " [16:40] 0.9873046875 1.0\n",
435
- " [40:64] 1.0 1.0\n",
436
- " [64:80] -0.97314453125 0.98681640625\n",
437
- " [80:104] 0.9873046875 1.0\n",
438
- " [104:128] 1.0 1.0\n",
439
- "18 torch.Size([128])\n",
440
- " [0:16] -0.97314453125 0.98681640625\n",
441
- " [16:40] 0.9873046875 1.0\n",
442
- " [40:64] 1.0 1.0\n",
443
- " [64:80] -0.97314453125 0.98681640625\n",
444
- " [80:104] 0.9873046875 1.0\n",
445
- " [104:128] 1.0 1.0\n",
446
- "19 torch.Size([128])\n",
447
- " [0:16] -0.97314453125 0.98681640625\n",
448
- " [16:40] 0.9873046875 1.0\n",
449
- " [40:64] 1.0 1.0\n",
450
- " [64:80] -0.97314453125 0.98681640625\n",
451
- " [80:104] 0.9873046875 1.0\n",
452
- " [104:128] 1.0 1.0\n",
453
- "20 torch.Size([128])\n",
454
- " [0:16] -0.97314453125 0.98681640625\n",
455
- " [16:40] 0.9873046875 1.0\n",
456
- " [40:64] 1.0 1.0\n",
457
- " [64:80] -0.97314453125 0.98681640625\n",
458
- " [80:104] 0.9873046875 1.0\n",
459
- " [104:128] 1.0 1.0\n",
460
- "21 torch.Size([128])\n",
461
- " [0:16] -0.97314453125 0.98681640625\n",
462
- " [16:40] 0.9873046875 1.0\n",
463
- " [40:64] 1.0 1.0\n",
464
- " [64:80] -0.97314453125 0.98681640625\n",
465
- " [80:104] 0.9873046875 1.0\n",
466
- " [104:128] 1.0 1.0\n",
467
- "22 torch.Size([128])\n",
468
- " [0:16] -0.97314453125 0.98681640625\n",
469
- " [16:40] 0.98193359375 1.0\n",
470
- " [40:64] 1.0 1.0\n",
471
- " [64:80] -0.97314453125 0.98681640625\n",
472
- " [80:104] 0.98193359375 1.0\n",
473
- " [104:128] 1.0 1.0\n",
474
- "23 torch.Size([128])\n",
475
- " [0:16] -0.97314453125 0.98681640625\n",
476
- " [16:40] 0.98193359375 1.0\n",
477
- " [40:64] 1.0 1.0\n",
478
- " [64:80] -0.97314453125 0.98681640625\n",
479
- " [80:104] 0.98193359375 1.0\n",
480
- " [104:128] 1.0 1.0\n",
481
- "24 torch.Size([128])\n",
482
- " [0:16] -0.97314453125 0.98681640625\n",
483
- " [16:40] 0.98193359375 1.0\n",
484
- " [40:64] 1.0 1.0\n",
485
- " [64:80] -0.97314453125 0.98681640625\n",
486
- " [80:104] 0.98193359375 1.0\n",
487
- " [104:128] 1.0 1.0\n",
488
- "25 torch.Size([128])\n",
489
- " [0:16] -0.97314453125 0.98681640625\n",
490
- " [16:40] 0.98193359375 1.0\n",
491
- " [40:64] 1.0 1.0\n",
492
- " [64:80] -0.97314453125 0.98681640625\n",
493
- " [80:104] 0.98193359375 1.0\n",
494
- " [104:128] 1.0 1.0\n",
495
- "26 torch.Size([128])\n",
496
- " [0:16] -0.97314453125 0.98681640625\n",
497
- " [16:40] 0.98193359375 1.0\n",
498
- " [40:64] 1.0 1.0\n",
499
- " [64:80] -0.97314453125 0.98681640625\n",
500
- " [80:104] 0.98193359375 1.0\n",
501
- " [104:128] 1.0 1.0\n",
502
- "27 torch.Size([128])\n",
503
- " [0:16] -0.97314453125 0.98681640625\n",
504
- " [16:40] 0.98193359375 1.0\n",
505
- " [40:64] 1.0 1.0\n",
506
- " [64:80] -0.97314453125 0.98681640625\n",
507
- " [80:104] 0.98193359375 1.0\n",
508
- " [104:128] 1.0 1.0\n",
509
- "28 torch.Size([128])\n",
510
- " [0:16] -0.97314453125 0.98681640625\n",
511
- " [16:40] 0.98193359375 1.0\n",
512
- " [40:64] 1.0 1.0\n",
513
- " [64:80] -0.97314453125 0.98681640625\n",
514
- " [80:104] 0.98193359375 1.0\n",
515
- " [104:128] 1.0 1.0\n",
516
- "29 torch.Size([128])\n",
517
- " [0:16] -0.97314453125 0.98681640625\n",
518
- " [16:40] 0.98193359375 1.0\n",
519
- " [40:64] 1.0 1.0\n",
520
- " [64:80] -0.97314453125 0.98681640625\n",
521
- " [80:104] 0.98193359375 1.0\n",
522
- " [104:128] 1.0 1.0\n",
523
- "30 torch.Size([128])\n",
524
- " [0:16] -0.97314453125 0.98681640625\n",
525
- " [16:40] 0.98193359375 1.0\n",
526
- " [40:64] 1.0 1.0\n",
527
- " [64:80] -0.97314453125 0.98681640625\n",
528
- " [80:104] 0.98193359375 1.0\n",
529
- " [104:128] 1.0 1.0\n",
530
- "31 torch.Size([128])\n",
531
- " [0:16] -0.97314453125 0.98681640625\n",
532
- " [16:40] 0.9755859375 1.0\n",
533
- " [40:64] 1.0 1.0\n",
534
- " [64:80] -0.97314453125 0.98681640625\n",
535
- " [80:104] 0.9755859375 1.0\n",
536
- " [104:128] 1.0 1.0\n",
537
- "32 torch.Size([128])\n",
538
- " [0:16] -0.97314453125 0.98681640625\n",
539
- " [16:40] 0.9755859375 1.0\n",
540
- " [40:64] 1.0 1.0\n",
541
- " [64:80] -0.97314453125 0.98681640625\n",
542
- " [80:104] 0.9755859375 1.0\n",
543
- " [104:128] 1.0 1.0\n",
544
- "33 torch.Size([128])\n",
545
- " [0:16] -0.97314453125 0.98681640625\n",
546
- " [16:40] 0.9755859375 1.0\n",
547
- " [40:64] 1.0 1.0\n",
548
- " [64:80] -0.97314453125 0.98681640625\n",
549
- " [80:104] 0.9755859375 1.0\n",
550
- " [104:128] 1.0 1.0\n",
551
- "34 torch.Size([128])\n",
552
- " [0:16] -0.97314453125 0.98681640625\n",
553
- " [16:40] 0.9755859375 1.0\n",
554
- " [40:64] 1.0 1.0\n",
555
- " [64:80] -0.97314453125 0.98681640625\n",
556
- " [80:104] 0.9755859375 1.0\n",
557
- " [104:128] 1.0 1.0\n",
558
- "35 torch.Size([128])\n",
559
- " [0:16] -0.97314453125 0.98681640625\n",
560
- " [16:40] 0.9755859375 1.0\n",
561
- " [40:64] 1.0 1.0\n",
562
- " [64:80] -0.97314453125 0.98681640625\n",
563
- " [80:104] 0.9755859375 1.0\n",
564
- " [104:128] 1.0 1.0\n",
565
- "36 torch.Size([128])\n",
566
- " [0:16] -0.97314453125 0.98681640625\n",
567
- " [16:40] 0.9755859375 1.0\n",
568
- " [40:64] 1.0 1.0\n",
569
- " [64:80] -0.97314453125 0.98681640625\n",
570
- " [80:104] 0.9755859375 1.0\n",
571
- " [104:128] 1.0 1.0\n",
572
- "37 torch.Size([128])\n",
573
- " [0:16] -0.97314453125 0.98681640625\n",
574
- " [16:40] 0.9755859375 1.0\n",
575
- " [40:64] 1.0 1.0\n",
576
- " [64:80] -0.97314453125 0.98681640625\n",
577
- " [80:104] 0.9755859375 1.0\n",
578
- " [104:128] 1.0 1.0\n",
579
- "38 torch.Size([128])\n",
580
- " [0:16] -0.97314453125 0.98681640625\n",
581
- " [16:40] 0.9755859375 1.0\n",
582
- " [40:64] 1.0 1.0\n",
583
- " [64:80] -0.97314453125 0.98681640625\n",
584
- " [80:104] 0.9755859375 1.0\n",
585
- " [104:128] 1.0 1.0\n",
586
- "39 torch.Size([128])\n",
587
- " [0:16] -0.97314453125 0.98681640625\n",
588
- " [16:40] 0.9755859375 1.0\n",
589
- " [40:64] 1.0 1.0\n",
590
- " [64:80] -0.97314453125 0.98681640625\n",
591
- " [80:104] 0.9755859375 1.0\n",
592
- " [104:128] 1.0 1.0\n",
593
- "40 torch.Size([128])\n",
594
- " [0:16] -0.97314453125 0.98681640625\n",
595
- " [16:40] 0.96826171875 1.0\n",
596
- " [40:64] 1.0 1.0\n",
597
- " [64:80] -0.97314453125 0.98681640625\n",
598
- " [80:104] 0.96826171875 1.0\n",
599
- " [104:128] 1.0 1.0\n",
600
- "41 torch.Size([128])\n",
601
- " [0:16] -0.97314453125 0.98681640625\n",
602
- " [16:40] 0.96826171875 1.0\n",
603
- " [40:64] 1.0 1.0\n",
604
- " [64:80] -0.97314453125 0.98681640625\n",
605
- " [80:104] 0.96826171875 1.0\n",
606
- " [104:128] 1.0 1.0\n",
607
- "42 torch.Size([128])\n",
608
- " [0:16] -0.97314453125 0.98681640625\n",
609
- " [16:40] 0.96826171875 1.0\n",
610
- " [40:64] 1.0 1.0\n",
611
- " [64:80] -0.97314453125 0.98681640625\n",
612
- " [80:104] 0.96826171875 1.0\n",
613
- " [104:128] 1.0 1.0\n",
614
- "43 torch.Size([128])\n",
615
- " [0:16] -0.97314453125 0.98681640625\n",
616
- " [16:40] 0.96826171875 1.0\n",
617
- " [40:64] 1.0 1.0\n",
618
- " [64:80] -0.97314453125 0.98681640625\n",
619
- " [80:104] 0.96826171875 1.0\n",
620
- " [104:128] 1.0 1.0\n",
621
- "44 torch.Size([128])\n",
622
- " [0:16] -0.97314453125 0.98681640625\n",
623
- " [16:40] 0.96826171875 1.0\n",
624
- " [40:64] 1.0 1.0\n",
625
- " [64:80] -0.97314453125 0.98681640625\n",
626
- " [80:104] 0.96826171875 1.0\n",
627
- " [104:128] 1.0 1.0\n",
628
- "45 torch.Size([128])\n",
629
- " [0:16] -0.97314453125 0.98681640625\n",
630
- " [16:40] 0.96826171875 1.0\n",
631
- " [40:64] 1.0 1.0\n",
632
- " [64:80] -0.97314453125 0.98681640625\n",
633
- " [80:104] 0.96826171875 1.0\n",
634
- " [104:128] 1.0 1.0\n",
635
- "46 torch.Size([128])\n",
636
- " [0:16] -0.97314453125 0.98681640625\n",
637
- " [16:40] 0.96826171875 1.0\n",
638
- " [40:64] 1.0 1.0\n",
639
- " [64:80] -0.97314453125 0.98681640625\n",
640
- " [80:104] 0.96826171875 1.0\n",
641
- " [104:128] 1.0 1.0\n",
642
- "47 torch.Size([128])\n",
643
- " [0:16] -0.97314453125 0.98681640625\n",
644
- " [16:40] 0.96826171875 1.0\n",
645
- " [40:64] 1.0 1.0\n",
646
- " [64:80] -0.97314453125 0.98681640625\n",
647
- " [80:104] 0.96826171875 1.0\n",
648
- " [104:128] 1.0 1.0\n",
649
- "48 torch.Size([128])\n",
650
- " [0:16] -0.97314453125 0.98681640625\n",
651
- " [16:40] 0.96826171875 1.0\n",
652
- " [40:64] 1.0 1.0\n",
653
- " [64:80] -0.97314453125 0.98681640625\n",
654
- " [80:104] 0.96826171875 1.0\n",
655
- " [104:128] 1.0 1.0\n",
656
- "49 torch.Size([128])\n",
657
- " [0:16] -0.97314453125 0.98681640625\n",
658
- " [16:40] 0.9599609375 1.0\n",
659
- " [40:64] 1.0 1.0\n",
660
- " [64:80] -0.97314453125 0.98681640625\n",
661
- " [80:104] 0.9599609375 1.0\n",
662
- " [104:128] 1.0 1.0\n",
663
- "50 torch.Size([128])\n",
664
- " [0:16] -0.97314453125 0.98681640625\n",
665
- " [16:40] 0.9599609375 1.0\n",
666
- " [40:64] 1.0 1.0\n",
667
- " [64:80] -0.97314453125 0.98681640625\n",
668
- " [80:104] 0.9599609375 1.0\n",
669
- " [104:128] 1.0 1.0\n",
670
- "51 torch.Size([128])\n",
671
- " [0:16] -0.97314453125 0.98681640625\n",
672
- " [16:40] 0.9599609375 1.0\n",
673
- " [40:64] 1.0 1.0\n",
674
- " [64:80] -0.97314453125 0.98681640625\n",
675
- " [80:104] 0.9599609375 1.0\n",
676
- " [104:128] 1.0 1.0\n",
677
- "52 torch.Size([128])\n",
678
- " [0:16] -0.97314453125 0.98681640625\n",
679
- " [16:40] 0.9599609375 1.0\n",
680
- " [40:64] 1.0 1.0\n",
681
- " [64:80] -0.97314453125 0.98681640625\n",
682
- " [80:104] 0.9599609375 1.0\n",
683
- " [104:128] 1.0 1.0\n",
684
- "53 torch.Size([128])\n",
685
- " [0:16] -0.97314453125 0.98681640625\n",
686
- " [16:40] 0.9599609375 1.0\n",
687
- " [40:64] 1.0 1.0\n",
688
- " [64:80] -0.97314453125 0.98681640625\n",
689
- " [80:104] 0.9599609375 1.0\n",
690
- " [104:128] 1.0 1.0\n",
691
- "54 torch.Size([128])\n",
692
- " [0:16] -0.97314453125 0.98681640625\n",
693
- " [16:40] 0.9599609375 1.0\n",
694
- " [40:64] 1.0 1.0\n",
695
- " [64:80] -0.97314453125 0.98681640625\n",
696
- " [80:104] 0.9599609375 1.0\n",
697
- " [104:128] 1.0 1.0\n",
698
- "55 torch.Size([128])\n",
699
- " [0:16] -0.97314453125 0.98681640625\n",
700
- " [16:40] 0.9599609375 1.0\n",
701
- " [40:64] 1.0 1.0\n",
702
- " [64:80] -0.97314453125 0.98681640625\n",
703
- " [80:104] 0.9599609375 1.0\n",
704
- " [104:128] 1.0 1.0\n",
705
- "56 torch.Size([128])\n",
706
- " [0:16] -0.97314453125 0.98681640625\n",
707
- " [16:40] 0.9599609375 1.0\n",
708
- " [40:64] 1.0 1.0\n",
709
- " [64:80] -0.97314453125 0.98681640625\n",
710
- " [80:104] 0.9599609375 1.0\n",
711
- " [104:128] 1.0 1.0\n",
712
- "57 torch.Size([128])\n",
713
- " [0:16] -0.97314453125 0.98681640625\n",
714
- " [16:40] 0.9599609375 1.0\n",
715
- " [40:64] 1.0 1.0\n",
716
- " [64:80] -0.97314453125 0.98681640625\n",
717
- " [80:104] 0.9599609375 1.0\n",
718
- " [104:128] 1.0 1.0\n",
719
- "58 torch.Size([128])\n",
720
- " [0:16] -0.97314453125 0.98681640625\n",
721
- " [16:40] 0.9501953125 1.0\n",
722
- " [40:64] 1.0 1.0\n",
723
- " [64:80] -0.97314453125 0.98681640625\n",
724
- " [80:104] 0.9501953125 1.0\n",
725
- " [104:128] 1.0 1.0\n",
726
- "59 torch.Size([128])\n",
727
- " [0:16] -0.97314453125 0.98681640625\n",
728
- " [16:40] 0.9501953125 1.0\n",
729
- " [40:64] 1.0 1.0\n",
730
- " [64:80] -0.97314453125 0.98681640625\n",
731
- " [80:104] 0.9501953125 1.0\n",
732
- " [104:128] 1.0 1.0\n",
733
- "60 torch.Size([128])\n",
734
- " [0:16] -0.97314453125 0.98681640625\n",
735
- " [16:40] 0.9501953125 1.0\n",
736
- " [40:64] 1.0 1.0\n",
737
- " [64:80] -0.97314453125 0.98681640625\n",
738
- " [80:104] 0.9501953125 1.0\n",
739
- " [104:128] 1.0 1.0\n",
740
- "61 torch.Size([128])\n",
741
- " [0:16] -0.97314453125 0.98681640625\n",
742
- " [16:40] 0.9501953125 1.0\n",
743
- " [40:64] 1.0 1.0\n",
744
- " [64:80] -0.97314453125 0.98681640625\n",
745
- " [80:104] 0.9501953125 1.0\n",
746
- " [104:128] 1.0 1.0\n",
747
- "62 torch.Size([128])\n",
748
- " [0:16] -0.97314453125 0.98681640625\n",
749
- " [16:40] 0.9501953125 1.0\n",
750
- " [40:64] 1.0 1.0\n",
751
- " [64:80] -0.97314453125 0.98681640625\n",
752
- " [80:104] 0.9501953125 1.0\n",
753
- " [104:128] 1.0 1.0\n",
754
- "63 torch.Size([128])\n",
755
- " [0:16] -0.97314453125 0.98681640625\n",
756
- " [16:40] 0.9501953125 1.0\n",
757
- " [40:64] 1.0 1.0\n",
758
- " [64:80] -0.97314453125 0.98681640625\n",
759
- " [80:104] 0.9501953125 1.0\n",
760
- " [104:128] 1.0 1.0\n",
761
- "64 torch.Size([128])\n",
762
- " [0:16] -0.97314453125 0.98681640625\n",
763
- " [16:40] 0.9501953125 1.0\n",
764
- " [40:64] 1.0 1.0\n",
765
- " [64:80] -0.97314453125 0.98681640625\n",
766
- " [80:104] 0.9501953125 1.0\n",
767
- " [104:128] 1.0 1.0\n",
768
- "65 torch.Size([128])\n",
769
- " [0:16] -0.97314453125 0.98681640625\n",
770
- " [16:40] 0.9501953125 1.0\n",
771
- " [40:64] 1.0 1.0\n",
772
- " [64:80] -0.97314453125 0.98681640625\n",
773
- " [80:104] 0.9501953125 1.0\n",
774
- " [104:128] 1.0 1.0\n",
775
- "66 torch.Size([128])\n",
776
- " [0:16] -0.97314453125 0.98681640625\n",
777
- " [16:40] 0.9501953125 1.0\n",
778
- " [40:64] 1.0 1.0\n",
779
- " [64:80] -0.97314453125 0.98681640625\n",
780
- " [80:104] 0.9501953125 1.0\n",
781
- " [104:128] 1.0 1.0\n",
782
- "67 torch.Size([128])\n",
783
- " [0:16] -0.97314453125 0.98681640625\n",
784
- " [16:40] 0.93994140625 1.0\n",
785
- " [40:64] 1.0 1.0\n",
786
- " [64:80] -0.97314453125 0.98681640625\n",
787
- " [80:104] 0.93994140625 1.0\n",
788
- " [104:128] 1.0 1.0\n",
789
- "68 torch.Size([128])\n",
790
- " [0:16] -0.97314453125 0.98681640625\n",
791
- " [16:40] 0.93994140625 1.0\n",
792
- " [40:64] 1.0 1.0\n",
793
- " [64:80] -0.97314453125 0.98681640625\n",
794
- " [80:104] 0.93994140625 1.0\n",
795
- " [104:128] 1.0 1.0\n",
796
- "69 torch.Size([128])\n",
797
- " [0:16] -0.97314453125 0.98681640625\n",
798
- " [16:40] 0.93994140625 1.0\n",
799
- " [40:64] 1.0 1.0\n",
800
- " [64:80] -0.97314453125 0.98681640625\n",
801
- " [80:104] 0.93994140625 1.0\n",
802
- " [104:128] 1.0 1.0\n",
803
- "70 torch.Size([128])\n",
804
- " [0:16] -0.97314453125 0.98681640625\n",
805
- " [16:40] 0.93994140625 1.0\n",
806
- " [40:64] 1.0 1.0\n",
807
- " [64:80] -0.97314453125 0.98681640625\n",
808
- " [80:104] 0.93994140625 1.0\n",
809
- " [104:128] 1.0 1.0\n",
810
- "71 torch.Size([128])\n",
811
- " [0:16] -0.97314453125 0.98681640625\n",
812
- " [16:40] 0.93994140625 1.0\n",
813
- " [40:64] 1.0 1.0\n",
814
- " [64:80] -0.97314453125 0.98681640625\n",
815
- " [80:104] 0.93994140625 1.0\n",
816
- " [104:128] 1.0 1.0\n",
817
- "72 torch.Size([128])\n",
818
- " [0:16] -0.97314453125 0.98681640625\n",
819
- " [16:40] 0.93994140625 1.0\n",
820
- " [40:64] 1.0 1.0\n",
821
- " [64:80] -0.97314453125 0.98681640625\n",
822
- " [80:104] 0.93994140625 1.0\n",
823
- " [104:128] 1.0 1.0\n",
824
- "73 torch.Size([128])\n",
825
- " [0:16] -0.97314453125 0.98681640625\n",
826
- " [16:40] 0.93994140625 1.0\n",
827
- " [40:64] 1.0 1.0\n",
828
- " [64:80] -0.97314453125 0.98681640625\n",
829
- " [80:104] 0.93994140625 1.0\n",
830
- " [104:128] 1.0 1.0\n",
831
- "74 torch.Size([128])\n",
832
- " [0:16] -0.97314453125 0.98681640625\n",
833
- " [16:40] 0.93994140625 1.0\n",
834
- " [40:64] 1.0 1.0\n",
835
- " [64:80] -0.97314453125 0.98681640625\n",
836
- " [80:104] 0.93994140625 1.0\n",
837
- " [104:128] 1.0 1.0\n",
838
- "75 torch.Size([128])\n",
839
- " [0:16] -0.97314453125 0.98681640625\n",
840
- " [16:40] 0.93994140625 1.0\n",
841
- " [40:64] 1.0 1.0\n",
842
- " [64:80] -0.97314453125 0.98681640625\n",
843
- " [80:104] 0.93994140625 1.0\n",
844
- " [104:128] 1.0 1.0\n",
845
- "76 torch.Size([128])\n",
846
- " [0:16] -0.97314453125 0.98681640625\n",
847
- " [16:40] 0.9287109375 1.0\n",
848
- " [40:64] 1.0 1.0\n",
849
- " [64:80] -0.97314453125 0.98681640625\n",
850
- " [80:104] 0.9287109375 1.0\n",
851
- " [104:128] 1.0 1.0\n",
852
- "77 torch.Size([128])\n",
853
- " [0:16] -0.97314453125 0.98681640625\n",
854
- " [16:40] 0.9287109375 1.0\n",
855
- " [40:64] 1.0 1.0\n",
856
- " [64:80] -0.97314453125 0.98681640625\n",
857
- " [80:104] 0.9287109375 1.0\n",
858
- " [104:128] 1.0 1.0\n",
859
- "78 torch.Size([128])\n",
860
- " [0:16] -0.97314453125 0.98681640625\n",
861
- " [16:40] 0.9287109375 1.0\n",
862
- " [40:64] 1.0 1.0\n",
863
- " [64:80] -0.97314453125 0.98681640625\n",
864
- " [80:104] 0.9287109375 1.0\n",
865
- " [104:128] 1.0 1.0\n",
866
- "79 torch.Size([128])\n",
867
- " [0:16] -0.97314453125 0.98681640625\n",
868
- " [16:40] 0.9287109375 1.0\n",
869
- " [40:64] 1.0 1.0\n",
870
- " [64:80] -0.97314453125 0.98681640625\n",
871
- " [80:104] 0.9287109375 1.0\n",
872
- " [104:128] 1.0 1.0\n",
873
- "80 torch.Size([128])\n",
874
- " [0:16] -0.97314453125 0.98681640625\n",
875
- " [16:40] 0.9287109375 1.0\n",
876
- " [40:64] 1.0 1.0\n",
877
- " [64:80] -0.97314453125 0.98681640625\n",
878
- " [80:104] 0.9287109375 1.0\n",
879
- " [104:128] 1.0 1.0\n",
880
- "81 torch.Size([128])\n",
881
- " [0:16] -0.97314453125 0.98681640625\n",
882
- " [16:40] 0.9287109375 1.0\n",
883
- " [40:64] 1.0 1.0\n",
884
- " [64:80] -0.97314453125 0.98681640625\n",
885
- " [80:104] 0.9287109375 1.0\n",
886
- " [104:128] 1.0 1.0\n",
887
- "82 torch.Size([128])\n",
888
- " [0:16] -0.97314453125 0.98681640625\n",
889
- " [16:40] 0.9287109375 1.0\n",
890
- " [40:64] 1.0 1.0\n",
891
- " [64:80] -0.97314453125 0.98681640625\n",
892
- " [80:104] 0.9287109375 1.0\n",
893
- " [104:128] 1.0 1.0\n",
894
- "83 torch.Size([128])\n",
895
- " [0:16] -0.97314453125 0.98681640625\n",
896
- " [16:40] 0.9287109375 1.0\n",
897
- " [40:64] 1.0 1.0\n",
898
- " [64:80] -0.97314453125 0.98681640625\n",
899
- " [80:104] 0.9287109375 1.0\n",
900
- " [104:128] 1.0 1.0\n",
901
- "84 torch.Size([128])\n",
902
- " [0:16] -0.97314453125 0.98681640625\n",
903
- " [16:40] 0.9287109375 1.0\n",
904
- " [40:64] 1.0 1.0\n",
905
- " [64:80] -0.97314453125 0.98681640625\n",
906
- " [80:104] 0.9287109375 1.0\n",
907
- " [104:128] 1.0 1.0\n",
908
- "85 torch.Size([128])\n",
909
- " [0:16] -0.962890625 0.9072265625\n",
910
- " [16:40] 0.91650390625 1.0\n",
911
- " [40:64] 1.0 1.0\n",
912
- " [64:80] -0.962890625 0.9072265625\n",
913
- " [80:104] 0.91650390625 1.0\n",
914
- " [104:128] 1.0 1.0\n",
915
- "86 torch.Size([128])\n",
916
- " [0:16] -0.99853515625 0.9287109375\n",
917
- " [16:40] 0.90380859375 1.0\n",
918
- " [40:64] 1.0 1.0\n",
919
- " [64:80] -0.99853515625 0.9287109375\n",
920
- " [80:104] 0.90380859375 1.0\n",
921
- " [104:128] 1.0 1.0\n",
922
- "87 torch.Size([128])\n",
923
- " [0:16] -0.98583984375 0.9990234375\n",
924
- " [16:40] 0.8896484375 1.0\n",
925
- " [40:64] 1.0 1.0\n",
926
- " [64:80] -0.98583984375 0.9990234375\n",
927
- " [80:104] 0.8896484375 1.0\n",
928
- " [104:128] 1.0 1.0\n",
929
- "88 torch.Size([128])\n",
930
- " [0:16] -0.95751953125 0.94677734375\n",
931
- " [16:40] 0.87451171875 1.0\n",
932
- " [40:64] 1.0 1.0\n",
933
- " [64:80] -0.95751953125 0.94677734375\n",
934
- " [80:104] 0.87451171875 1.0\n",
935
- " [104:128] 1.0 1.0\n",
936
- "89 torch.Size([128])\n",
937
- " [0:16] -0.9931640625 0.87451171875\n",
938
- " [16:40] 0.85888671875 1.0\n",
939
- " [40:64] 1.0 1.0\n",
940
- " [64:80] -0.9931640625 0.87451171875\n",
941
- " [80:104] 0.85888671875 1.0\n",
942
- " [104:128] 1.0 1.0\n",
943
- "90 torch.Size([128])\n",
944
- " [0:16] -1.0 0.986328125\n",
945
- " [16:40] 0.84228515625 1.0\n",
946
- " [40:64] 1.0 1.0\n",
947
- " [64:80] -1.0 0.986328125\n",
948
- " [80:104] 0.84228515625 1.0\n",
949
- " [104:128] 1.0 1.0\n",
950
- "91 torch.Size([128])\n",
951
- " [0:16] -0.97216796875 0.98876953125\n",
952
- " [16:40] 0.82470703125 1.0\n",
953
- " [40:64] 1.0 1.0\n",
954
- " [64:80] -0.97216796875 0.98876953125\n",
955
- " [80:104] 0.82470703125 1.0\n",
956
- " [104:128] 1.0 1.0\n",
957
- "92 torch.Size([128])\n",
958
- " [0:16] -0.96240234375 0.91259765625\n",
959
- " [16:40] 0.806640625 1.0\n",
960
- " [40:64] 1.0 1.0\n",
961
- " [64:80] -0.96240234375 0.91259765625\n",
962
- " [80:104] 0.806640625 1.0\n",
963
- " [104:128] 1.0 1.0\n",
964
- "93 torch.Size([128])\n",
965
- " [0:16] -0.9912109375 0.861328125\n",
966
- " [16:40] 0.78759765625 1.0\n",
967
- " [40:64] 1.0 1.0\n",
968
- " [64:80] -0.9912109375 0.861328125\n",
969
- " [80:104] 0.78759765625 1.0\n",
970
- " [104:128] 1.0 1.0\n"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
971
  ]
972
  }
973
  ],
974
  "source": [
975
  "cos_reshaped = cos.squeeze(0).squeeze(0)\n",
 
 
976
  "for idx, tensor in enumerate(cos_reshaped):\n",
977
- " print(idx, tensor.shape)\n",
978
  " # print(tensor[16:40].flatten().tolist())\n",
979
- " if tensor.shape[0] != 128:\n",
980
- " print(f\"Skipping tensor {idx} with shape {tensor.shape}\")\n",
981
- " continue\n",
982
- " else:\n",
983
- " print(f\" [0:16] {tensor[0:16].min()} {tensor[0:16].max()}\")\n",
984
- " print(f\" [16:40] {tensor[16:40].min()} {tensor[16:40].max()}\")\n",
985
- " print(f\" [40:64] {tensor[40:64].min()} {tensor[40:64].max()}\")\n",
986
- " print(f\" [64:80] {tensor[64:80].min()} {tensor[64:80].max()}\")\n",
987
- " print(f\" [80:104] {tensor[80:104].min()} {tensor[80:104].max()}\")\n",
988
- " print(f\" [104:128] {tensor[104:128].min()} {tensor[104:128].max()}\")"
989
  ]
990
  },
991
  {
 
293
  },
294
  {
295
  "cell_type": "code",
296
+ "execution_count": 19,
297
  "id": "039f1456-ffa4-40b2-8ba1-a0cd5f74733e",
298
  "metadata": {
299
  "execution": {
300
+ "iopub.execute_input": "2026-03-25T09:39:03.854302Z",
301
+ "iopub.status.busy": "2026-03-25T09:39:03.854035Z",
302
+ "iopub.status.idle": "2026-03-25T09:39:03.944941Z",
303
+ "shell.execute_reply": "2026-03-25T09:39:03.944353Z",
304
+ "shell.execute_reply.started": "2026-03-25T09:39:03.854284Z"
305
  },
306
  "scrolled": true
307
  },
 
310
  "name": "stdout",
311
  "output_type": "stream",
312
  "text": [
313
+ "\n",
314
+ " 0 torch.Size([128])\n",
315
+ " [ 0: 16] - 16 | [1.0, 1.0]\n",
316
+ " [ 16: 40] - 24 | [1.0, 1.0]\n",
317
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
318
+ " [ 64: 80] - 16 | [1.0, 1.0]\n",
319
+ " [ 80:104] - 24 | [1.0, 1.0]\n",
320
+ " [104:128] - 24 | [1.0, 1.0]\n",
321
+ "\n",
322
+ " 1 torch.Size([128])\n",
323
+ " [ 0: 16] - 0 | [0.54052734375, 0.9990234375]\n",
324
+ " [ 16: 40] - 22 | [0.99951171875, 1.0]\n",
325
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
326
+ " [ 64: 80] - 0 | [0.54052734375, 0.9990234375]\n",
327
+ " [ 80:104] - 22 | [0.99951171875, 1.0]\n",
328
+ " [104:128] - 24 | [1.0, 1.0]\n",
329
+ "\n",
330
+ " 2 torch.Size([128])\n",
331
+ " [ 0: 16] - 0 | [-0.416259765625, 0.9970703125]\n",
332
+ " [ 16: 40] - 19 | [0.998046875, 1.0]\n",
333
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
334
+ " [ 64: 80] - 0 | [-0.416259765625, 0.9970703125]\n",
335
+ " [ 80:104] - 19 | [0.998046875, 1.0]\n",
336
+ " [104:128] - 24 | [1.0, 1.0]\n",
337
+ "\n",
338
+ " 3 torch.Size([128])\n",
339
+ " [ 0: 16] - 0 | [-0.990234375, 0.9931640625]\n",
340
+ " [ 16: 40] - 17 | [0.99560546875, 1.0]\n",
341
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
342
+ " [ 64: 80] - 0 | [-0.990234375, 0.9931640625]\n",
343
+ " [ 80:104] - 17 | [0.99560546875, 1.0]\n",
344
+ " [104:128] - 24 | [1.0, 1.0]\n",
345
+ "\n",
346
+ " 4 torch.Size([128])\n",
347
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
348
+ " [ 16: 40] - 15 | [0.9921875, 1.0]\n",
349
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
350
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
351
+ " [ 80:104] - 15 | [0.9921875, 1.0]\n",
352
+ " [104:128] - 24 | [1.0, 1.0]\n",
353
+ "\n",
354
+ " 5 torch.Size([128])\n",
355
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
356
+ " [ 16: 40] - 15 | [0.9921875, 1.0]\n",
357
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
358
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
359
+ " [ 80:104] - 15 | [0.9921875, 1.0]\n",
360
+ " [104:128] - 24 | [1.0, 1.0]\n",
361
+ "\n",
362
+ " 6 torch.Size([128])\n",
363
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
364
+ " [ 16: 40] - 15 | [0.9921875, 1.0]\n",
365
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
366
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
367
+ " [ 80:104] - 15 | [0.9921875, 1.0]\n",
368
+ " [104:128] - 24 | [1.0, 1.0]\n",
369
+ "\n",
370
+ " 7 torch.Size([128])\n",
371
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
372
+ " [ 16: 40] - 15 | [0.9921875, 1.0]\n",
373
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
374
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
375
+ " [ 80:104] - 15 | [0.9921875, 1.0]\n",
376
+ " [104:128] - 24 | [1.0, 1.0]\n",
377
+ "\n",
378
+ " 8 torch.Size([128])\n",
379
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
380
+ " [ 16: 40] - 15 | [0.9921875, 1.0]\n",
381
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
382
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
383
+ " [ 80:104] - 15 | [0.9921875, 1.0]\n",
384
+ " [104:128] - 24 | [1.0, 1.0]\n",
385
+ "\n",
386
+ " 9 torch.Size([128])\n",
387
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
388
+ " [ 16: 40] - 15 | [0.9921875, 1.0]\n",
389
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
390
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
391
+ " [ 80:104] - 15 | [0.9921875, 1.0]\n",
392
+ " [104:128] - 24 | [1.0, 1.0]\n",
393
+ "\n",
394
+ " 10 torch.Size([128])\n",
395
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
396
+ " [ 16: 40] - 15 | [0.9921875, 1.0]\n",
397
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
398
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
399
+ " [ 80:104] - 15 | [0.9921875, 1.0]\n",
400
+ " [104:128] - 24 | [1.0, 1.0]\n",
401
+ "\n",
402
+ " 11 torch.Size([128])\n",
403
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
404
+ " [ 16: 40] - 15 | [0.9921875, 1.0]\n",
405
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
406
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
407
+ " [ 80:104] - 15 | [0.9921875, 1.0]\n",
408
+ " [104:128] - 24 | [1.0, 1.0]\n",
409
+ "\n",
410
+ " 12 torch.Size([128])\n",
411
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
412
+ " [ 16: 40] - 15 | [0.9921875, 1.0]\n",
413
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
414
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
415
+ " [ 80:104] - 15 | [0.9921875, 1.0]\n",
416
+ " [104:128] - 24 | [1.0, 1.0]\n",
417
+ "\n",
418
+ " 13 torch.Size([128])\n",
419
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
420
+ " [ 16: 40] - 14 | [0.9873046875, 1.0]\n",
421
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
422
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
423
+ " [ 80:104] - 14 | [0.9873046875, 1.0]\n",
424
+ " [104:128] - 24 | [1.0, 1.0]\n",
425
+ "\n",
426
+ " 14 torch.Size([128])\n",
427
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
428
+ " [ 16: 40] - 14 | [0.9873046875, 1.0]\n",
429
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
430
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
431
+ " [ 80:104] - 14 | [0.9873046875, 1.0]\n",
432
+ " [104:128] - 24 | [1.0, 1.0]\n",
433
+ "\n",
434
+ " 15 torch.Size([128])\n",
435
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
436
+ " [ 16: 40] - 14 | [0.9873046875, 1.0]\n",
437
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
438
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
439
+ " [ 80:104] - 14 | [0.9873046875, 1.0]\n",
440
+ " [104:128] - 24 | [1.0, 1.0]\n",
441
+ "\n",
442
+ " 16 torch.Size([128])\n",
443
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
444
+ " [ 16: 40] - 14 | [0.9873046875, 1.0]\n",
445
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
446
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
447
+ " [ 80:104] - 14 | [0.9873046875, 1.0]\n",
448
+ " [104:128] - 24 | [1.0, 1.0]\n",
449
+ "\n",
450
+ " 17 torch.Size([128])\n",
451
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
452
+ " [ 16: 40] - 14 | [0.9873046875, 1.0]\n",
453
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
454
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
455
+ " [ 80:104] - 14 | [0.9873046875, 1.0]\n",
456
+ " [104:128] - 24 | [1.0, 1.0]\n",
457
+ "\n",
458
+ " 18 torch.Size([128])\n",
459
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
460
+ " [ 16: 40] - 14 | [0.9873046875, 1.0]\n",
461
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
462
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
463
+ " [ 80:104] - 14 | [0.9873046875, 1.0]\n",
464
+ " [104:128] - 24 | [1.0, 1.0]\n",
465
+ "\n",
466
+ " 19 torch.Size([128])\n",
467
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
468
+ " [ 16: 40] - 14 | [0.9873046875, 1.0]\n",
469
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
470
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
471
+ " [ 80:104] - 14 | [0.9873046875, 1.0]\n",
472
+ " [104:128] - 24 | [1.0, 1.0]\n",
473
+ "\n",
474
+ " 20 torch.Size([128])\n",
475
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
476
+ " [ 16: 40] - 14 | [0.9873046875, 1.0]\n",
477
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
478
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
479
+ " [ 80:104] - 14 | [0.9873046875, 1.0]\n",
480
+ " [104:128] - 24 | [1.0, 1.0]\n",
481
+ "\n",
482
+ " 21 torch.Size([128])\n",
483
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
484
+ " [ 16: 40] - 14 | [0.9873046875, 1.0]\n",
485
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
486
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
487
+ " [ 80:104] - 14 | [0.9873046875, 1.0]\n",
488
+ " [104:128] - 24 | [1.0, 1.0]\n",
489
+ "\n",
490
+ " 22 torch.Size([128])\n",
491
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
492
+ " [ 16: 40] - 14 | [0.98193359375, 1.0]\n",
493
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
494
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
495
+ " [ 80:104] - 14 | [0.98193359375, 1.0]\n",
496
+ " [104:128] - 24 | [1.0, 1.0]\n",
497
+ "\n",
498
+ " 23 torch.Size([128])\n",
499
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
500
+ " [ 16: 40] - 14 | [0.98193359375, 1.0]\n",
501
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
502
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
503
+ " [ 80:104] - 14 | [0.98193359375, 1.0]\n",
504
+ " [104:128] - 24 | [1.0, 1.0]\n",
505
+ "\n",
506
+ " 24 torch.Size([128])\n",
507
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
508
+ " [ 16: 40] - 14 | [0.98193359375, 1.0]\n",
509
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
510
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
511
+ " [ 80:104] - 14 | [0.98193359375, 1.0]\n",
512
+ " [104:128] - 24 | [1.0, 1.0]\n",
513
+ "\n",
514
+ " 25 torch.Size([128])\n",
515
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
516
+ " [ 16: 40] - 14 | [0.98193359375, 1.0]\n",
517
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
518
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
519
+ " [ 80:104] - 14 | [0.98193359375, 1.0]\n",
520
+ " [104:128] - 24 | [1.0, 1.0]\n",
521
+ "\n",
522
+ " 26 torch.Size([128])\n",
523
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
524
+ " [ 16: 40] - 14 | [0.98193359375, 1.0]\n",
525
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
526
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
527
+ " [ 80:104] - 14 | [0.98193359375, 1.0]\n",
528
+ " [104:128] - 24 | [1.0, 1.0]\n",
529
+ "\n",
530
+ " 27 torch.Size([128])\n",
531
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
532
+ " [ 16: 40] - 14 | [0.98193359375, 1.0]\n",
533
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
534
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
535
+ " [ 80:104] - 14 | [0.98193359375, 1.0]\n",
536
+ " [104:128] - 24 | [1.0, 1.0]\n",
537
+ "\n",
538
+ " 28 torch.Size([128])\n",
539
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
540
+ " [ 16: 40] - 14 | [0.98193359375, 1.0]\n",
541
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
542
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
543
+ " [ 80:104] - 14 | [0.98193359375, 1.0]\n",
544
+ " [104:128] - 24 | [1.0, 1.0]\n",
545
+ "\n",
546
+ " 29 torch.Size([128])\n",
547
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
548
+ " [ 16: 40] - 14 | [0.98193359375, 1.0]\n",
549
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
550
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
551
+ " [ 80:104] - 14 | [0.98193359375, 1.0]\n",
552
+ " [104:128] - 24 | [1.0, 1.0]\n",
553
+ "\n",
554
+ " 30 torch.Size([128])\n",
555
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
556
+ " [ 16: 40] - 14 | [0.98193359375, 1.0]\n",
557
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
558
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
559
+ " [ 80:104] - 14 | [0.98193359375, 1.0]\n",
560
+ " [104:128] - 24 | [1.0, 1.0]\n",
561
+ "\n",
562
+ " 31 torch.Size([128])\n",
563
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
564
+ " [ 16: 40] - 13 | [0.9755859375, 1.0]\n",
565
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
566
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
567
+ " [ 80:104] - 13 | [0.9755859375, 1.0]\n",
568
+ " [104:128] - 24 | [1.0, 1.0]\n",
569
+ "\n",
570
+ " 32 torch.Size([128])\n",
571
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
572
+ " [ 16: 40] - 13 | [0.9755859375, 1.0]\n",
573
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
574
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
575
+ " [ 80:104] - 13 | [0.9755859375, 1.0]\n",
576
+ " [104:128] - 24 | [1.0, 1.0]\n",
577
+ "\n",
578
+ " 33 torch.Size([128])\n",
579
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
580
+ " [ 16: 40] - 13 | [0.9755859375, 1.0]\n",
581
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
582
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
583
+ " [ 80:104] - 13 | [0.9755859375, 1.0]\n",
584
+ " [104:128] - 24 | [1.0, 1.0]\n",
585
+ "\n",
586
+ " 34 torch.Size([128])\n",
587
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
588
+ " [ 16: 40] - 13 | [0.9755859375, 1.0]\n",
589
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
590
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
591
+ " [ 80:104] - 13 | [0.9755859375, 1.0]\n",
592
+ " [104:128] - 24 | [1.0, 1.0]\n",
593
+ "\n",
594
+ " 35 torch.Size([128])\n",
595
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
596
+ " [ 16: 40] - 13 | [0.9755859375, 1.0]\n",
597
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
598
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
599
+ " [ 80:104] - 13 | [0.9755859375, 1.0]\n",
600
+ " [104:128] - 24 | [1.0, 1.0]\n",
601
+ "\n",
602
+ " 36 torch.Size([128])\n",
603
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
604
+ " [ 16: 40] - 13 | [0.9755859375, 1.0]\n",
605
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
606
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
607
+ " [ 80:104] - 13 | [0.9755859375, 1.0]\n",
608
+ " [104:128] - 24 | [1.0, 1.0]\n",
609
+ "\n",
610
+ " 37 torch.Size([128])\n",
611
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
612
+ " [ 16: 40] - 13 | [0.9755859375, 1.0]\n",
613
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
614
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
615
+ " [ 80:104] - 13 | [0.9755859375, 1.0]\n",
616
+ " [104:128] - 24 | [1.0, 1.0]\n",
617
+ "\n",
618
+ " 38 torch.Size([128])\n",
619
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
620
+ " [ 16: 40] - 13 | [0.9755859375, 1.0]\n",
621
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
622
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
623
+ " [ 80:104] - 13 | [0.9755859375, 1.0]\n",
624
+ " [104:128] - 24 | [1.0, 1.0]\n",
625
+ "\n",
626
+ " 39 torch.Size([128])\n",
627
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
628
+ " [ 16: 40] - 13 | [0.9755859375, 1.0]\n",
629
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
630
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
631
+ " [ 80:104] - 13 | [0.9755859375, 1.0]\n",
632
+ " [104:128] - 24 | [1.0, 1.0]\n",
633
+ "\n",
634
+ " 40 torch.Size([128])\n",
635
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
636
+ " [ 16: 40] - 12 | [0.96826171875, 1.0]\n",
637
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
638
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
639
+ " [ 80:104] - 12 | [0.96826171875, 1.0]\n",
640
+ " [104:128] - 24 | [1.0, 1.0]\n",
641
+ "\n",
642
+ " 41 torch.Size([128])\n",
643
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
644
+ " [ 16: 40] - 12 | [0.96826171875, 1.0]\n",
645
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
646
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
647
+ " [ 80:104] - 12 | [0.96826171875, 1.0]\n",
648
+ " [104:128] - 24 | [1.0, 1.0]\n",
649
+ "\n",
650
+ " 42 torch.Size([128])\n",
651
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
652
+ " [ 16: 40] - 12 | [0.96826171875, 1.0]\n",
653
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
654
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
655
+ " [ 80:104] - 12 | [0.96826171875, 1.0]\n",
656
+ " [104:128] - 24 | [1.0, 1.0]\n",
657
+ "\n",
658
+ " 43 torch.Size([128])\n",
659
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
660
+ " [ 16: 40] - 12 | [0.96826171875, 1.0]\n",
661
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
662
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
663
+ " [ 80:104] - 12 | [0.96826171875, 1.0]\n",
664
+ " [104:128] - 24 | [1.0, 1.0]\n",
665
+ "\n",
666
+ " 44 torch.Size([128])\n",
667
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
668
+ " [ 16: 40] - 12 | [0.96826171875, 1.0]\n",
669
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
670
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
671
+ " [ 80:104] - 12 | [0.96826171875, 1.0]\n",
672
+ " [104:128] - 24 | [1.0, 1.0]\n",
673
+ "\n",
674
+ " 45 torch.Size([128])\n",
675
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
676
+ " [ 16: 40] - 12 | [0.96826171875, 1.0]\n",
677
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
678
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
679
+ " [ 80:104] - 12 | [0.96826171875, 1.0]\n",
680
+ " [104:128] - 24 | [1.0, 1.0]\n",
681
+ "\n",
682
+ " 46 torch.Size([128])\n",
683
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
684
+ " [ 16: 40] - 12 | [0.96826171875, 1.0]\n",
685
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
686
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
687
+ " [ 80:104] - 12 | [0.96826171875, 1.0]\n",
688
+ " [104:128] - 24 | [1.0, 1.0]\n",
689
+ "\n",
690
+ " 47 torch.Size([128])\n",
691
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
692
+ " [ 16: 40] - 12 | [0.96826171875, 1.0]\n",
693
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
694
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
695
+ " [ 80:104] - 12 | [0.96826171875, 1.0]\n",
696
+ " [104:128] - 24 | [1.0, 1.0]\n",
697
+ "\n",
698
+ " 48 torch.Size([128])\n",
699
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
700
+ " [ 16: 40] - 12 | [0.96826171875, 1.0]\n",
701
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
702
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
703
+ " [ 80:104] - 12 | [0.96826171875, 1.0]\n",
704
+ " [104:128] - 24 | [1.0, 1.0]\n",
705
+ "\n",
706
+ " 49 torch.Size([128])\n",
707
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
708
+ " [ 16: 40] - 12 | [0.9599609375, 1.0]\n",
709
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
710
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
711
+ " [ 80:104] - 12 | [0.9599609375, 1.0]\n",
712
+ " [104:128] - 24 | [1.0, 1.0]\n",
713
+ "\n",
714
+ " 50 torch.Size([128])\n",
715
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
716
+ " [ 16: 40] - 12 | [0.9599609375, 1.0]\n",
717
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
718
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
719
+ " [ 80:104] - 12 | [0.9599609375, 1.0]\n",
720
+ " [104:128] - 24 | [1.0, 1.0]\n",
721
+ "\n",
722
+ " 51 torch.Size([128])\n",
723
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
724
+ " [ 16: 40] - 12 | [0.9599609375, 1.0]\n",
725
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
726
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
727
+ " [ 80:104] - 12 | [0.9599609375, 1.0]\n",
728
+ " [104:128] - 24 | [1.0, 1.0]\n",
729
+ "\n",
730
+ " 52 torch.Size([128])\n",
731
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
732
+ " [ 16: 40] - 12 | [0.9599609375, 1.0]\n",
733
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
734
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
735
+ " [ 80:104] - 12 | [0.9599609375, 1.0]\n",
736
+ " [104:128] - 24 | [1.0, 1.0]\n",
737
+ "\n",
738
+ " 53 torch.Size([128])\n",
739
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
740
+ " [ 16: 40] - 12 | [0.9599609375, 1.0]\n",
741
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
742
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
743
+ " [ 80:104] - 12 | [0.9599609375, 1.0]\n",
744
+ " [104:128] - 24 | [1.0, 1.0]\n",
745
+ "\n",
746
+ " 54 torch.Size([128])\n",
747
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
748
+ " [ 16: 40] - 12 | [0.9599609375, 1.0]\n",
749
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
750
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
751
+ " [ 80:104] - 12 | [0.9599609375, 1.0]\n",
752
+ " [104:128] - 24 | [1.0, 1.0]\n",
753
+ "\n",
754
+ " 55 torch.Size([128])\n",
755
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
756
+ " [ 16: 40] - 12 | [0.9599609375, 1.0]\n",
757
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
758
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
759
+ " [ 80:104] - 12 | [0.9599609375, 1.0]\n",
760
+ " [104:128] - 24 | [1.0, 1.0]\n",
761
+ "\n",
762
+ " 56 torch.Size([128])\n",
763
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
764
+ " [ 16: 40] - 12 | [0.9599609375, 1.0]\n",
765
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
766
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
767
+ " [ 80:104] - 12 | [0.9599609375, 1.0]\n",
768
+ " [104:128] - 24 | [1.0, 1.0]\n",
769
+ "\n",
770
+ " 57 torch.Size([128])\n",
771
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
772
+ " [ 16: 40] - 12 | [0.9599609375, 1.0]\n",
773
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
774
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
775
+ " [ 80:104] - 12 | [0.9599609375, 1.0]\n",
776
+ " [104:128] - 24 | [1.0, 1.0]\n",
777
+ "\n",
778
+ " 58 torch.Size([128])\n",
779
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
780
+ " [ 16: 40] - 11 | [0.9501953125, 1.0]\n",
781
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
782
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
783
+ " [ 80:104] - 11 | [0.9501953125, 1.0]\n",
784
+ " [104:128] - 24 | [1.0, 1.0]\n",
785
+ "\n",
786
+ " 59 torch.Size([128])\n",
787
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
788
+ " [ 16: 40] - 11 | [0.9501953125, 1.0]\n",
789
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
790
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
791
+ " [ 80:104] - 11 | [0.9501953125, 1.0]\n",
792
+ " [104:128] - 24 | [1.0, 1.0]\n",
793
+ "\n",
794
+ " 60 torch.Size([128])\n",
795
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
796
+ " [ 16: 40] - 11 | [0.9501953125, 1.0]\n",
797
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
798
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
799
+ " [ 80:104] - 11 | [0.9501953125, 1.0]\n",
800
+ " [104:128] - 24 | [1.0, 1.0]\n",
801
+ "\n",
802
+ " 61 torch.Size([128])\n",
803
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
804
+ " [ 16: 40] - 11 | [0.9501953125, 1.0]\n",
805
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
806
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
807
+ " [ 80:104] - 11 | [0.9501953125, 1.0]\n",
808
+ " [104:128] - 24 | [1.0, 1.0]\n",
809
+ "\n",
810
+ " 62 torch.Size([128])\n",
811
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
812
+ " [ 16: 40] - 11 | [0.9501953125, 1.0]\n",
813
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
814
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
815
+ " [ 80:104] - 11 | [0.9501953125, 1.0]\n",
816
+ " [104:128] - 24 | [1.0, 1.0]\n",
817
+ "\n",
818
+ " 63 torch.Size([128])\n",
819
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
820
+ " [ 16: 40] - 11 | [0.9501953125, 1.0]\n",
821
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
822
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
823
+ " [ 80:104] - 11 | [0.9501953125, 1.0]\n",
824
+ " [104:128] - 24 | [1.0, 1.0]\n",
825
+ "\n",
826
+ " 64 torch.Size([128])\n",
827
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
828
+ " [ 16: 40] - 11 | [0.9501953125, 1.0]\n",
829
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
830
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
831
+ " [ 80:104] - 11 | [0.9501953125, 1.0]\n",
832
+ " [104:128] - 24 | [1.0, 1.0]\n",
833
+ "\n",
834
+ " 65 torch.Size([128])\n",
835
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
836
+ " [ 16: 40] - 11 | [0.9501953125, 1.0]\n",
837
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
838
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
839
+ " [ 80:104] - 11 | [0.9501953125, 1.0]\n",
840
+ " [104:128] - 24 | [1.0, 1.0]\n",
841
+ "\n",
842
+ " 66 torch.Size([128])\n",
843
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
844
+ " [ 16: 40] - 11 | [0.9501953125, 1.0]\n",
845
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
846
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
847
+ " [ 80:104] - 11 | [0.9501953125, 1.0]\n",
848
+ " [104:128] - 24 | [1.0, 1.0]\n",
849
+ "\n",
850
+ " 67 torch.Size([128])\n",
851
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
852
+ " [ 16: 40] - 11 | [0.93994140625, 1.0]\n",
853
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
854
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
855
+ " [ 80:104] - 11 | [0.93994140625, 1.0]\n",
856
+ " [104:128] - 24 | [1.0, 1.0]\n",
857
+ "\n",
858
+ " 68 torch.Size([128])\n",
859
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
860
+ " [ 16: 40] - 11 | [0.93994140625, 1.0]\n",
861
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
862
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
863
+ " [ 80:104] - 11 | [0.93994140625, 1.0]\n",
864
+ " [104:128] - 24 | [1.0, 1.0]\n",
865
+ "\n",
866
+ " 69 torch.Size([128])\n",
867
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
868
+ " [ 16: 40] - 11 | [0.93994140625, 1.0]\n",
869
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
870
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
871
+ " [ 80:104] - 11 | [0.93994140625, 1.0]\n",
872
+ " [104:128] - 24 | [1.0, 1.0]\n",
873
+ "\n",
874
+ " 70 torch.Size([128])\n",
875
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
876
+ " [ 16: 40] - 11 | [0.93994140625, 1.0]\n",
877
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
878
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
879
+ " [ 80:104] - 11 | [0.93994140625, 1.0]\n",
880
+ " [104:128] - 24 | [1.0, 1.0]\n",
881
+ "\n",
882
+ " 71 torch.Size([128])\n",
883
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
884
+ " [ 16: 40] - 11 | [0.93994140625, 1.0]\n",
885
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
886
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
887
+ " [ 80:104] - 11 | [0.93994140625, 1.0]\n",
888
+ " [104:128] - 24 | [1.0, 1.0]\n",
889
+ "\n",
890
+ " 72 torch.Size([128])\n",
891
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
892
+ " [ 16: 40] - 11 | [0.93994140625, 1.0]\n",
893
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
894
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
895
+ " [ 80:104] - 11 | [0.93994140625, 1.0]\n",
896
+ " [104:128] - 24 | [1.0, 1.0]\n",
897
+ "\n",
898
+ " 73 torch.Size([128])\n",
899
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
900
+ " [ 16: 40] - 11 | [0.93994140625, 1.0]\n",
901
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
902
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
903
+ " [ 80:104] - 11 | [0.93994140625, 1.0]\n",
904
+ " [104:128] - 24 | [1.0, 1.0]\n",
905
+ "\n",
906
+ " 74 torch.Size([128])\n",
907
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
908
+ " [ 16: 40] - 11 | [0.93994140625, 1.0]\n",
909
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
910
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
911
+ " [ 80:104] - 11 | [0.93994140625, 1.0]\n",
912
+ " [104:128] - 24 | [1.0, 1.0]\n",
913
+ "\n",
914
+ " 75 torch.Size([128])\n",
915
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
916
+ " [ 16: 40] - 11 | [0.93994140625, 1.0]\n",
917
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
918
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
919
+ " [ 80:104] - 11 | [0.93994140625, 1.0]\n",
920
+ " [104:128] - 24 | [1.0, 1.0]\n",
921
+ "\n",
922
+ " 76 torch.Size([128])\n",
923
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
924
+ " [ 16: 40] - 10 | [0.9287109375, 1.0]\n",
925
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
926
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
927
+ " [ 80:104] - 10 | [0.9287109375, 1.0]\n",
928
+ " [104:128] - 24 | [1.0, 1.0]\n",
929
+ "\n",
930
+ " 77 torch.Size([128])\n",
931
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
932
+ " [ 16: 40] - 10 | [0.9287109375, 1.0]\n",
933
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
934
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
935
+ " [ 80:104] - 10 | [0.9287109375, 1.0]\n",
936
+ " [104:128] - 24 | [1.0, 1.0]\n",
937
+ "\n",
938
+ " 78 torch.Size([128])\n",
939
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
940
+ " [ 16: 40] - 10 | [0.9287109375, 1.0]\n",
941
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
942
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
943
+ " [ 80:104] - 10 | [0.9287109375, 1.0]\n",
944
+ " [104:128] - 24 | [1.0, 1.0]\n",
945
+ "\n",
946
+ " 79 torch.Size([128])\n",
947
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
948
+ " [ 16: 40] - 10 | [0.9287109375, 1.0]\n",
949
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
950
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
951
+ " [ 80:104] - 10 | [0.9287109375, 1.0]\n",
952
+ " [104:128] - 24 | [1.0, 1.0]\n",
953
+ "\n",
954
+ " 80 torch.Size([128])\n",
955
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
956
+ " [ 16: 40] - 10 | [0.9287109375, 1.0]\n",
957
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
958
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
959
+ " [ 80:104] - 10 | [0.9287109375, 1.0]\n",
960
+ " [104:128] - 24 | [1.0, 1.0]\n",
961
+ "\n",
962
+ " 81 torch.Size([128])\n",
963
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
964
+ " [ 16: 40] - 10 | [0.9287109375, 1.0]\n",
965
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
966
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
967
+ " [ 80:104] - 10 | [0.9287109375, 1.0]\n",
968
+ " [104:128] - 24 | [1.0, 1.0]\n",
969
+ "\n",
970
+ " 82 torch.Size([128])\n",
971
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
972
+ " [ 16: 40] - 10 | [0.9287109375, 1.0]\n",
973
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
974
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
975
+ " [ 80:104] - 10 | [0.9287109375, 1.0]\n",
976
+ " [104:128] - 24 | [1.0, 1.0]\n",
977
+ "\n",
978
+ " 83 torch.Size([128])\n",
979
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
980
+ " [ 16: 40] - 10 | [0.9287109375, 1.0]\n",
981
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
982
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
983
+ " [ 80:104] - 10 | [0.9287109375, 1.0]\n",
984
+ " [104:128] - 24 | [1.0, 1.0]\n",
985
+ "\n",
986
+ " 84 torch.Size([128])\n",
987
+ " [ 0: 16] - 0 | [-0.97314453125, 0.98681640625]\n",
988
+ " [ 16: 40] - 10 | [0.9287109375, 1.0]\n",
989
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
990
+ " [ 64: 80] - 0 | [-0.97314453125, 0.98681640625]\n",
991
+ " [ 80:104] - 10 | [0.9287109375, 1.0]\n",
992
+ " [104:128] - 24 | [1.0, 1.0]\n",
993
+ "\n",
994
+ " 85 torch.Size([128])\n",
995
+ " [ 0: 16] - 0 | [-0.962890625, 0.9072265625]\n",
996
+ " [ 16: 40] - 10 | [0.91650390625, 1.0]\n",
997
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
998
+ " [ 64: 80] - 0 | [-0.962890625, 0.9072265625]\n",
999
+ " [ 80:104] - 10 | [0.91650390625, 1.0]\n",
1000
+ " [104:128] - 24 | [1.0, 1.0]\n",
1001
+ "\n",
1002
+ " 86 torch.Size([128])\n",
1003
+ " [ 0: 16] - 0 | [-0.99853515625, 0.9287109375]\n",
1004
+ " [ 16: 40] - 10 | [0.90380859375, 1.0]\n",
1005
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
1006
+ " [ 64: 80] - 0 | [-0.99853515625, 0.9287109375]\n",
1007
+ " [ 80:104] - 10 | [0.90380859375, 1.0]\n",
1008
+ " [104:128] - 24 | [1.0, 1.0]\n",
1009
+ "\n",
1010
+ " 87 torch.Size([128])\n",
1011
+ " [ 0: 16] - 0 | [-0.98583984375, 0.9990234375]\n",
1012
+ " [ 16: 40] - 9 | [0.8896484375, 1.0]\n",
1013
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
1014
+ " [ 64: 80] - 0 | [-0.98583984375, 0.9990234375]\n",
1015
+ " [ 80:104] - 9 | [0.8896484375, 1.0]\n",
1016
+ " [104:128] - 24 | [1.0, 1.0]\n",
1017
+ "\n",
1018
+ " 88 torch.Size([128])\n",
1019
+ " [ 0: 16] - 0 | [-0.95751953125, 0.94677734375]\n",
1020
+ " [ 16: 40] - 9 | [0.87451171875, 1.0]\n",
1021
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
1022
+ " [ 64: 80] - 0 | [-0.95751953125, 0.94677734375]\n",
1023
+ " [ 80:104] - 9 | [0.87451171875, 1.0]\n",
1024
+ " [104:128] - 24 | [1.0, 1.0]\n",
1025
+ "\n",
1026
+ " 89 torch.Size([128])\n",
1027
+ " [ 0: 16] - 0 | [-0.9931640625, 0.87451171875]\n",
1028
+ " [ 16: 40] - 9 | [0.85888671875, 1.0]\n",
1029
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
1030
+ " [ 64: 80] - 0 | [-0.9931640625, 0.87451171875]\n",
1031
+ " [ 80:104] - 9 | [0.85888671875, 1.0]\n",
1032
+ " [104:128] - 24 | [1.0, 1.0]\n",
1033
+ "\n",
1034
+ " 90 torch.Size([128])\n",
1035
+ " [ 0: 16] - 0 | [-1.0, 0.986328125]\n",
1036
+ " [ 16: 40] - 8 | [0.84228515625, 1.0]\n",
1037
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
1038
+ " [ 64: 80] - 0 | [-1.0, 0.986328125]\n",
1039
+ " [ 80:104] - 8 | [0.84228515625, 1.0]\n",
1040
+ " [104:128] - 24 | [1.0, 1.0]\n",
1041
+ "\n",
1042
+ " 91 torch.Size([128])\n",
1043
+ " [ 0: 16] - 0 | [-0.97216796875, 0.98876953125]\n",
1044
+ " [ 16: 40] - 8 | [0.82470703125, 1.0]\n",
1045
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
1046
+ " [ 64: 80] - 0 | [-0.97216796875, 0.98876953125]\n",
1047
+ " [ 80:104] - 8 | [0.82470703125, 1.0]\n",
1048
+ " [104:128] - 24 | [1.0, 1.0]\n",
1049
+ "\n",
1050
+ " 92 torch.Size([128])\n",
1051
+ " [ 0: 16] - 0 | [-0.96240234375, 0.91259765625]\n",
1052
+ " [ 16: 40] - 8 | [0.806640625, 1.0]\n",
1053
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
1054
+ " [ 64: 80] - 0 | [-0.96240234375, 0.91259765625]\n",
1055
+ " [ 80:104] - 8 | [0.806640625, 1.0]\n",
1056
+ " [104:128] - 24 | [1.0, 1.0]\n",
1057
+ "\n",
1058
+ " 93 torch.Size([128])\n",
1059
+ " [ 0: 16] - 0 | [-0.9912109375, 0.861328125]\n",
1060
+ " [ 16: 40] - 8 | [0.78759765625, 1.0]\n",
1061
+ " [ 40: 64] - 24 | [1.0, 1.0]\n",
1062
+ " [ 64: 80] - 0 | [-0.9912109375, 0.861328125]\n",
1063
+ " [ 80:104] - 8 | [0.78759765625, 1.0]\n",
1064
+ " [104:128] - 24 | [1.0, 1.0]\n"
1065
  ]
1066
  }
1067
  ],
1068
  "source": [
1069
  "cos_reshaped = cos.squeeze(0).squeeze(0)\n",
1070
+ "ranges = [(0, 16), (16, 40), (40, 64), (64, 80), (80, 104), (104, 128)]\n",
1071
+ "\n",
1072
  "for idx, tensor in enumerate(cos_reshaped):\n",
1073
+ " print('\\n', idx, tensor.shape)\n",
1074
  " # print(tensor[16:40].flatten().tolist())\n",
1075
+ " for start, end in ranges:\n",
1076
+ " print(f\" [{start :3}:{end :3}] - {(tensor[start:end] == 1.0).sum().item() :2} | [{tensor[start:end].min()}, {tensor[start:end].max()}]\")"
 
 
 
 
 
 
 
 
1077
  ]
1078
  },
1079
  {