diff --git "a/wandb/run-20220302_085255-16llzpbl/files/wandb-summary.json" "b/wandb/run-20220302_085255-16llzpbl/files/wandb-summary.json" --- "a/wandb/run-20220302_085255-16llzpbl/files/wandb-summary.json" +++ "b/wandb/run-20220302_085255-16llzpbl/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 3.9784, "train/learning_rate": 9.345794392523364e-07, "train/epoch": 1.0, "train/global_step": 1784, "_runtime": 8574, "_timestamp": 1646219749, "_step": 1787, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 13.0, 17.0, 52.0, 415.0, 420.0, 70.0, 16.0, 4.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-925.3422241210938, -902.2313232421875, -879.120361328125, -856.0094604492188, -832.8985595703125, -809.78759765625, -786.6766967773438, -763.5657958984375, -740.454833984375, -717.3439331054688, -694.2329711914062, -671.1220703125, -648.0111083984375, -624.9002075195312, -601.789306640625, -578.6783447265625, -555.5674438476562, -532.45654296875, -509.3455810546875, -486.23468017578125, -463.1237487792969, -440.0128173828125, -416.90191650390625, -393.7909851074219, -370.6800537109375, -347.5691223144531, -324.45819091796875, -301.3472900390625, -278.2363586425781, -255.12542724609375, -232.01451110839844, -208.90359497070312, -185.79266357421875, -162.68173217773438, -139.57081604003906, -116.45989227294922, -93.34896850585938, -70.23804473876953, -47.12712097167969, -24.016204833984375, -0.9052734375, 22.205650329589844, 45.31657409667969, 68.42749786376953, 91.53842163085938, 114.64934539794922, 137.76026916503906, 160.87118530273438, 183.98211669921875, 207.09304809570312, 230.20396423339844, 253.31488037109375, 276.4258117675781, 299.5367431640625, 322.64764404296875, 345.7585754394531, 368.8695068359375, 391.9804382324219, 415.09136962890625, 438.2022705078125, 461.3132019042969, 484.42413330078125, 507.5350341796875, 530.64599609375, 553.7568969726562]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 6.0, 7.0, 8.0, 13.0, 11.0, 7.0, 8.0, 15.0, 18.0, 21.0, 20.0, 18.0, 25.0, 30.0, 34.0, 27.0, 70.0, 176.0, 140.0, 82.0, 30.0, 23.0, 28.0, 28.0, 23.0, 23.0, 17.0, 17.0, 14.0, 13.0, 5.0, 7.0, 10.0, 6.0, 8.0, 4.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-667.4768676757812, -646.577392578125, -625.6779174804688, -604.7784423828125, -583.8789672851562, -562.9794921875, -542.0800170898438, -521.1805419921875, -500.2810974121094, -479.3816223144531, -458.4821472167969, -437.5826721191406, -416.6832275390625, -395.78375244140625, -374.88427734375, -353.98480224609375, -333.0853271484375, -312.18585205078125, -291.286376953125, -270.38690185546875, -249.48744201660156, -228.5879669189453, -207.68850708007812, -186.78903198242188, -165.88955688476562, -144.99008178710938, -124.09061431884766, -103.19114685058594, -82.29167175292969, -61.39219665527344, -40.49272918701172, -19.59326171875, 1.30621337890625, 22.205684661865234, 43.10515594482422, 64.00462341308594, 84.90409851074219, 105.80357360839844, 126.70304107666016, 147.60250854492188, 168.50198364257812, 189.40145874023438, 210.30093383789062, 231.2003936767578, 252.09986877441406, 272.99932861328125, 293.8988037109375, 314.79827880859375, 335.69775390625, 356.59722900390625, 377.4967041015625, 398.39617919921875, 419.295654296875, 440.19512939453125, 461.0945739746094, 481.9940490722656, 502.8935241699219, 523.79296875, 544.6924438476562, 565.5919189453125, 586.4913940429688, 607.390869140625, 628.2903442382812, 649.1898193359375, 670.0892944335938]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 8.0, 10.0, 11.0, 9.0, 5.0, 10.0, 14.0, 11.0, 24.0, 20.0, 21.0, 19.0, 28.0, 39.0, 25.0, 67.0, 113.0, 133.0, 109.0, 60.0, 33.0, 24.0, 25.0, 24.0, 23.0, 21.0, 16.0, 22.0, 8.0, 11.0, 9.0, 5.0, 6.0, 9.0, 1.0, 10.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.859375, -10.5013427734375, -10.143310546875, -9.7852783203125, -9.42724609375, -9.0692138671875, -8.711181640625, -8.3531494140625, -7.9951171875, -7.6370849609375, -7.279052734375, -6.9210205078125, -6.56298828125, -6.2049560546875, -5.846923828125, -5.4888916015625, -5.130859375, -4.7728271484375, -4.414794921875, -4.0567626953125, -3.69873046875, -3.3406982421875, -2.982666015625, -2.6246337890625, -2.2666015625, -1.9085693359375, -1.550537109375, -1.1925048828125, -0.83447265625, -0.4764404296875, -0.118408203125, 0.2396240234375, 0.59765625, 0.9556884765625, 1.313720703125, 1.6717529296875, 2.02978515625, 2.3878173828125, 2.745849609375, 3.1038818359375, 3.4619140625, 3.8199462890625, 4.177978515625, 4.5360107421875, 4.89404296875, 5.2520751953125, 5.610107421875, 5.9681396484375, 6.326171875, 6.6842041015625, 7.042236328125, 7.4002685546875, 7.75830078125, 8.1163330078125, 8.474365234375, 8.8323974609375, 9.1904296875, 9.5484619140625, 9.906494140625, 10.2645263671875, 10.62255859375, 10.9805908203125, 11.338623046875, 11.6966552734375, 12.0546875]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 6.0, 5.0, 10.0, 9.0, 14.0, 21.0, 33.0, 36.0, 59.0, 58.0, 72.0, 88.0, 145.0, 197.0, 306.0, 383.0, 600.0, 1027.0, 1953.0, 3929.0, 10399.0, 43091.0, 4044670.0, 65124.0, 12372.0, 4412.0, 2005.0, 1166.0, 640.0, 383.0, 269.0, 216.0, 166.0, 105.0, 78.0, 52.0, 40.0, 26.0, 31.0, 22.0, 17.0, 20.0, 7.0, 8.0, 3.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-107.3125, -103.802734375, -100.29296875, -96.783203125, -93.2734375, -89.763671875, -86.25390625, -82.744140625, -79.234375, -75.724609375, -72.21484375, -68.705078125, -65.1953125, -61.685546875, -58.17578125, -54.666015625, -51.15625, -47.646484375, -44.13671875, -40.626953125, -37.1171875, -33.607421875, -30.09765625, -26.587890625, -23.078125, -19.568359375, -16.05859375, -12.548828125, -9.0390625, -5.529296875, -2.01953125, 1.490234375, 5.0, 8.509765625, 12.01953125, 15.529296875, 19.0390625, 22.548828125, 26.05859375, 29.568359375, 33.078125, 36.587890625, 40.09765625, 43.607421875, 47.1171875, 50.626953125, 54.13671875, 57.646484375, 61.15625, 64.666015625, 68.17578125, 71.685546875, 75.1953125, 78.705078125, 82.21484375, 85.724609375, 89.234375, 92.744140625, 96.25390625, 99.763671875, 103.2734375, 106.783203125, 110.29296875, 113.802734375, 117.3125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 6.0, 4.0, 12.0, 10.0, 13.0, 22.0, 19.0, 20.0, 29.0, 35.0, 32.0, 57.0, 56.0, 87.0, 189.0, 439.0, 1039.0, 927.0, 489.0, 192.0, 102.0, 66.0, 42.0, 30.0, 28.0, 23.0, 11.0, 26.0, 13.0, 7.0, 13.0, 6.0, 2.0, 7.0, 2.0, 3.0, 1.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-38.0, -36.77294921875, -35.5458984375, -34.31884765625, -33.091796875, -31.86474609375, -30.6376953125, -29.41064453125, -28.18359375, -26.95654296875, -25.7294921875, -24.50244140625, -23.275390625, -22.04833984375, -20.8212890625, -19.59423828125, -18.3671875, -17.14013671875, -15.9130859375, -14.68603515625, -13.458984375, -12.23193359375, -11.0048828125, -9.77783203125, -8.55078125, -7.32373046875, -6.0966796875, -4.86962890625, -3.642578125, -2.41552734375, -1.1884765625, 0.03857421875, 1.265625, 2.49267578125, 3.7197265625, 4.94677734375, 6.173828125, 7.40087890625, 8.6279296875, 9.85498046875, 11.08203125, 12.30908203125, 13.5361328125, 14.76318359375, 15.990234375, 17.21728515625, 18.4443359375, 19.67138671875, 20.8984375, 22.12548828125, 23.3525390625, 24.57958984375, 25.806640625, 27.03369140625, 28.2607421875, 29.48779296875, 30.71484375, 31.94189453125, 33.1689453125, 34.39599609375, 35.623046875, 36.85009765625, 38.0771484375, 39.30419921875, 40.53125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 8.0, 6.0, 10.0, 8.0, 18.0, 14.0, 23.0, 28.0, 37.0, 53.0, 71.0, 76.0, 82.0, 129.0, 175.0, 280.0, 496.0, 1232.0, 5414.0, 40811.0, 3830796.0, 292463.0, 17032.0, 2993.0, 821.0, 371.0, 210.0, 128.0, 105.0, 82.0, 67.0, 48.0, 45.0, 31.0, 22.0, 24.0, 10.0, 14.0, 10.0, 13.0, 8.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-108.3125, -105.0107421875, -101.708984375, -98.4072265625, -95.10546875, -91.8037109375, -88.501953125, -85.2001953125, -81.8984375, -78.5966796875, -75.294921875, -71.9931640625, -68.69140625, -65.3896484375, -62.087890625, -58.7861328125, -55.484375, -52.1826171875, -48.880859375, -45.5791015625, -42.27734375, -38.9755859375, -35.673828125, -32.3720703125, -29.0703125, -25.7685546875, -22.466796875, -19.1650390625, -15.86328125, -12.5615234375, -9.259765625, -5.9580078125, -2.65625, 0.6455078125, 3.947265625, 7.2490234375, 10.55078125, 13.8525390625, 17.154296875, 20.4560546875, 23.7578125, 27.0595703125, 30.361328125, 33.6630859375, 36.96484375, 40.2666015625, 43.568359375, 46.8701171875, 50.171875, 53.4736328125, 56.775390625, 60.0771484375, 63.37890625, 66.6806640625, 69.982421875, 73.2841796875, 76.5859375, 79.8876953125, 83.189453125, 86.4912109375, 89.79296875, 93.0947265625, 96.396484375, 99.6982421875, 103.0]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 8.0, 4.0, 32.0, 28.0, 87.0, 247.0, 436.0, 126.0, 27.0, 10.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-182.33505249023438, -174.4733428955078, -166.61163330078125, -158.74990844726562, -150.88819885253906, -143.0264892578125, -135.16477966308594, -127.30306243896484, -119.44134521484375, -111.57963562011719, -103.7179183959961, -95.85620880126953, -87.99449157714844, -80.13278198242188, -72.27107238769531, -64.40935516357422, -56.547645568847656, -48.68593215942383, -40.82421875, -32.96250915527344, -25.100793838500977, -17.23908233642578, -9.377368927001953, -1.515655517578125, 6.346057891845703, 14.207771301269531, 22.06948471069336, 29.931196212768555, 37.79290771484375, 45.65462112426758, 53.516334533691406, 61.378047943115234, 69.23976135253906, 77.10147094726562, 84.96318817138672, 92.82489776611328, 100.68661499023438, 108.54832458496094, 116.4100341796875, 124.2717514038086, 132.1334686279297, 139.99517822265625, 147.8568878173828, 155.71861267089844, 163.580322265625, 171.44203186035156, 179.30374145507812, 187.16546630859375, 195.02716064453125, 202.8888702392578, 210.75057983398438, 218.6123046875, 226.47401428222656, 234.33572387695312, 242.1974334716797, 250.05914306640625, 257.9208679199219, 265.7825927734375, 273.644287109375, 281.5060119628906, 289.3677062988281, 297.22943115234375, 305.0911560058594, 312.9528503417969, 320.8145751953125]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 6.0, 6.0, 8.0, 5.0, 10.0, 13.0, 9.0, 15.0, 17.0, 19.0, 35.0, 24.0, 34.0, 32.0, 41.0, 29.0, 41.0, 39.0, 47.0, 45.0, 45.0, 40.0, 41.0, 40.0, 35.0, 36.0, 45.0, 33.0, 26.0, 21.0, 38.0, 20.0, 20.0, 17.0, 8.0, 11.0, 10.0, 8.0, 3.0, 11.0, 6.0, 0.0, 3.0, 6.0, 3.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-144.60552978515625, -139.92665100097656, -135.24777221679688, -130.5688934326172, -125.89002227783203, -121.21114349365234, -116.53227233886719, -111.8533935546875, -107.17451477050781, -102.49563598632812, -97.81675720214844, -93.13788604736328, -88.4590072631836, -83.7801284790039, -79.10125732421875, -74.42237854003906, -69.74349975585938, -65.06462097167969, -60.385746002197266, -55.706871032714844, -51.027992248535156, -46.34911346435547, -41.67023849487305, -36.991363525390625, -32.31248474121094, -27.633607864379883, -22.954730987548828, -18.275854110717773, -13.596977233886719, -8.918100357055664, -4.239223480224609, 0.4396514892578125, 5.1185302734375, 9.797407150268555, 14.47628402709961, 19.155160903930664, 23.83403778076172, 28.512914657592773, 33.19179153442383, 37.87066650390625, 42.54954528808594, 47.228424072265625, 51.90729904174805, 56.58617401123047, 61.265052795410156, 65.94393157958984, 70.622802734375, 75.30168151855469, 79.98056030273438, 84.65943908691406, 89.33831787109375, 94.0171890258789, 98.6960678100586, 103.37494659423828, 108.05381774902344, 112.73269653320312, 117.41157531738281, 122.0904541015625, 126.76933288574219, 131.44821166992188, 136.1270751953125, 140.8059539794922, 145.48483276367188, 150.16371154785156, 154.84259033203125]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 6.0, 5.0, 7.0, 12.0, 9.0, 7.0, 10.0, 8.0, 9.0, 17.0, 18.0, 25.0, 16.0, 28.0, 30.0, 42.0, 58.0, 62.0, 94.0, 92.0, 99.0, 62.0, 49.0, 31.0, 28.0, 22.0, 20.0, 27.0, 12.0, 20.0, 10.0, 12.0, 8.0, 6.0, 7.0, 8.0, 7.0, 3.0, 3.0, 8.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.984375, -8.666259765625, -8.34814453125, -8.030029296875, -7.7119140625, -7.393798828125, -7.07568359375, -6.757568359375, -6.439453125, -6.121337890625, -5.80322265625, -5.485107421875, -5.1669921875, -4.848876953125, -4.53076171875, -4.212646484375, -3.89453125, -3.576416015625, -3.25830078125, -2.940185546875, -2.6220703125, -2.303955078125, -1.98583984375, -1.667724609375, -1.349609375, -1.031494140625, -0.71337890625, -0.395263671875, -0.0771484375, 0.240966796875, 0.55908203125, 0.877197265625, 1.1953125, 1.513427734375, 1.83154296875, 2.149658203125, 2.4677734375, 2.785888671875, 3.10400390625, 3.422119140625, 3.740234375, 4.058349609375, 4.37646484375, 4.694580078125, 5.0126953125, 5.330810546875, 5.64892578125, 5.967041015625, 6.28515625, 6.603271484375, 6.92138671875, 7.239501953125, 7.5576171875, 7.875732421875, 8.19384765625, 8.511962890625, 8.830078125, 9.148193359375, 9.46630859375, 9.784423828125, 10.1025390625, 10.420654296875, 10.73876953125, 11.056884765625, 11.375]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 7.0, 2.0, 4.0, 5.0, 12.0, 7.0, 14.0, 27.0, 34.0, 32.0, 72.0, 101.0, 167.0, 251.0, 349.0, 549.0, 899.0, 1281.0, 2107.0, 3302.0, 5285.0, 8595.0, 14270.0, 24499.0, 45156.0, 91610.0, 220269.0, 345453.0, 139140.0, 63874.0, 33210.0, 18630.0, 11075.0, 6694.0, 4237.0, 2608.0, 1642.0, 1056.0, 724.0, 435.0, 307.0, 176.0, 145.0, 83.0, 59.0, 34.0, 23.0, 15.0, 18.0, 7.0, 8.0, 2.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2169189453125, -0.2097492218017578, -0.20257949829101562, -0.19540977478027344, -0.18824005126953125, -0.18107032775878906, -0.17390060424804688, -0.1667308807373047, -0.1595611572265625, -0.1523914337158203, -0.14522171020507812, -0.13805198669433594, -0.13088226318359375, -0.12371253967285156, -0.11654281616210938, -0.10937309265136719, -0.102203369140625, -0.09503364562988281, -0.08786392211914062, -0.08069419860839844, -0.07352447509765625, -0.06635475158691406, -0.059185028076171875, -0.05201530456542969, -0.0448455810546875, -0.03767585754394531, -0.030506134033203125, -0.023336410522460938, -0.01616668701171875, -0.008996963500976562, -0.001827239990234375, 0.0053424835205078125, 0.01251220703125, 0.019681930541992188, 0.026851654052734375, 0.03402137756347656, 0.04119110107421875, 0.04836082458496094, 0.055530548095703125, 0.06270027160644531, 0.0698699951171875, 0.07703971862792969, 0.08420944213867188, 0.09137916564941406, 0.09854888916015625, 0.10571861267089844, 0.11288833618164062, 0.12005805969238281, 0.127227783203125, 0.1343975067138672, 0.14156723022460938, 0.14873695373535156, 0.15590667724609375, 0.16307640075683594, 0.17024612426757812, 0.1774158477783203, 0.1845855712890625, 0.1917552947998047, 0.19892501831054688, 0.20609474182128906, 0.21326446533203125, 0.22043418884277344, 0.22760391235351562, 0.2347736358642578, 0.241943359375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 4.0, 6.0, 8.0, 5.0, 11.0, 9.0, 11.0, 10.0, 17.0, 15.0, 17.0, 39.0, 33.0, 32.0, 27.0, 39.0, 32.0, 42.0, 39.0, 41.0, 1076.0, 44.0, 38.0, 35.0, 56.0, 32.0, 27.0, 36.0, 36.0, 36.0, 30.0, 24.0, 20.0, 18.0, 15.0, 5.0, 13.0, 10.0, 9.0, 12.0, 4.0, 8.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.83203125, -3.71209716796875, -3.5921630859375, -3.47222900390625, -3.352294921875, -3.23236083984375, -3.1124267578125, -2.99249267578125, -2.87255859375, -2.75262451171875, -2.6326904296875, -2.51275634765625, -2.392822265625, -2.27288818359375, -2.1529541015625, -2.03302001953125, -1.9130859375, -1.79315185546875, -1.6732177734375, -1.55328369140625, -1.433349609375, -1.31341552734375, -1.1934814453125, -1.07354736328125, -0.95361328125, -0.83367919921875, -0.7137451171875, -0.59381103515625, -0.473876953125, -0.35394287109375, -0.2340087890625, -0.11407470703125, 0.005859375, 0.12579345703125, 0.2457275390625, 0.36566162109375, 0.485595703125, 0.60552978515625, 0.7254638671875, 0.84539794921875, 0.96533203125, 1.08526611328125, 1.2052001953125, 1.32513427734375, 1.445068359375, 1.56500244140625, 1.6849365234375, 1.80487060546875, 1.9248046875, 2.04473876953125, 2.1646728515625, 2.28460693359375, 2.404541015625, 2.52447509765625, 2.6444091796875, 2.76434326171875, 2.88427734375, 3.00421142578125, 3.1241455078125, 3.24407958984375, 3.364013671875, 3.48394775390625, 3.6038818359375, 3.72381591796875, 3.84375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 7.0, 8.0, 6.0, 20.0, 23.0, 19.0, 32.0, 61.0, 103.0, 202.0, 247.0, 416.0, 651.0, 1078.0, 1692.0, 2530.0, 3929.0, 6618.0, 10139.0, 16359.0, 26951.0, 43944.0, 73001.0, 123554.0, 295003.0, 1173434.0, 125691.0, 74704.0, 44797.0, 27022.0, 16652.0, 10456.0, 6455.0, 4041.0, 2647.0, 1655.0, 1177.0, 669.0, 407.0, 248.0, 177.0, 96.0, 63.0, 56.0, 33.0, 18.0, 15.0, 16.0, 4.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.07220458984375, -0.07001781463623047, -0.06783103942871094, -0.0656442642211914, -0.06345748901367188, -0.061270713806152344, -0.05908393859863281, -0.05689716339111328, -0.05471038818359375, -0.05252361297607422, -0.05033683776855469, -0.048150062561035156, -0.045963287353515625, -0.043776512145996094, -0.04158973693847656, -0.03940296173095703, -0.0372161865234375, -0.03502941131591797, -0.03284263610839844, -0.030655860900878906, -0.028469085693359375, -0.026282310485839844, -0.024095535278320312, -0.02190876007080078, -0.01972198486328125, -0.01753520965576172, -0.015348434448242188, -0.013161659240722656, -0.010974884033203125, -0.008788108825683594, -0.0066013336181640625, -0.004414558410644531, -0.002227783203125, -4.100799560546875e-05, 0.0021457672119140625, 0.004332542419433594, 0.006519317626953125, 0.008706092834472656, 0.010892868041992188, 0.013079643249511719, 0.01526641845703125, 0.01745319366455078, 0.019639968872070312, 0.021826744079589844, 0.024013519287109375, 0.026200294494628906, 0.028387069702148438, 0.03057384490966797, 0.0327606201171875, 0.03494739532470703, 0.03713417053222656, 0.039320945739746094, 0.041507720947265625, 0.043694496154785156, 0.04588127136230469, 0.04806804656982422, 0.05025482177734375, 0.05244159698486328, 0.05462837219238281, 0.056815147399902344, 0.059001922607421875, 0.061188697814941406, 0.06337547302246094, 0.06556224822998047, 0.0677490234375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 6.0, 8.0, 8.0, 8.0, 15.0, 22.0, 28.0, 20.0, 20.0, 39.0, 54.0, 57.0, 48.0, 71.0, 92.0, 79.0, 69.0, 71.0, 44.0, 47.0, 42.0, 32.0, 16.0, 20.0, 12.0, 20.0, 8.0, 9.0, 11.0, 4.0, 9.0, 6.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015306472778320312, -0.00014693289995193481, -0.0001408010721206665, -0.0001346692442893982, -0.00012853741645812988, -0.00012240558862686157, -0.00011627376079559326, -0.00011014193296432495, -0.00010401010513305664, -9.787827730178833e-05, -9.174644947052002e-05, -8.561462163925171e-05, -7.94827938079834e-05, -7.335096597671509e-05, -6.721913814544678e-05, -6.108731031417847e-05, -5.4955482482910156e-05, -4.8823654651641846e-05, -4.2691826820373535e-05, -3.6559998989105225e-05, -3.0428171157836914e-05, -2.4296343326568604e-05, -1.8164515495300293e-05, -1.2032687664031982e-05, -5.900859832763672e-06, 2.3096799850463867e-07, 6.362795829772949e-06, 1.249462366104126e-05, 1.862645149230957e-05, 2.475827932357788e-05, 3.089010715484619e-05, 3.70219349861145e-05, 4.315376281738281e-05, 4.928559064865112e-05, 5.5417418479919434e-05, 6.154924631118774e-05, 6.768107414245605e-05, 7.381290197372437e-05, 7.994472980499268e-05, 8.607655763626099e-05, 9.22083854675293e-05, 9.834021329879761e-05, 0.00010447204113006592, 0.00011060386896133423, 0.00011673569679260254, 0.00012286752462387085, 0.00012899935245513916, 0.00013513118028640747, 0.00014126300811767578, 0.0001473948359489441, 0.0001535266637802124, 0.0001596584916114807, 0.00016579031944274902, 0.00017192214727401733, 0.00017805397510528564, 0.00018418580293655396, 0.00019031763076782227, 0.00019644945859909058, 0.0002025812864303589, 0.0002087131142616272, 0.0002148449420928955, 0.00022097676992416382, 0.00022710859775543213, 0.00023324042558670044, 0.00023937225341796875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 9.0, 11.0, 15.0, 16.0, 28.0, 33.0, 37.0, 68.0, 77.0, 91.0, 108.0, 180.0, 256.0, 399.0, 1135.0, 1041621.0, 2885.0, 497.0, 285.0, 224.0, 157.0, 75.0, 82.0, 64.0, 54.0, 28.0, 39.0, 29.0, 15.0, 15.0, 5.0, 7.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.004215240478515625, -0.004086136817932129, -0.003957033157348633, -0.0038279294967651367, -0.0036988258361816406, -0.0035697221755981445, -0.0034406185150146484, -0.0033115148544311523, -0.0031824111938476562, -0.00305330753326416, -0.002924203872680664, -0.002795100212097168, -0.002665996551513672, -0.0025368928909301758, -0.0024077892303466797, -0.0022786855697631836, -0.0021495819091796875, -0.0020204782485961914, -0.0018913745880126953, -0.0017622709274291992, -0.0016331672668457031, -0.001504063606262207, -0.001374959945678711, -0.0012458562850952148, -0.0011167526245117188, -0.0009876489639282227, -0.0008585453033447266, -0.0007294416427612305, -0.0006003379821777344, -0.0004712343215942383, -0.0003421306610107422, -0.0002130270004272461, -8.392333984375e-05, 4.5180320739746094e-05, 0.0001742839813232422, 0.0003033876419067383, 0.0004324913024902344, 0.0005615949630737305, 0.0006906986236572266, 0.0008198022842407227, 0.0009489059448242188, 0.0010780096054077148, 0.001207113265991211, 0.001336216926574707, 0.0014653205871582031, 0.0015944242477416992, 0.0017235279083251953, 0.0018526315689086914, 0.0019817352294921875, 0.0021108388900756836, 0.0022399425506591797, 0.0023690462112426758, 0.002498149871826172, 0.002627253532409668, 0.002756357192993164, 0.00288546085357666, 0.0030145645141601562, 0.0031436681747436523, 0.0032727718353271484, 0.0034018754959106445, 0.0035309791564941406, 0.0036600828170776367, 0.003789186477661133, 0.003918290138244629, 0.004047393798828125]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1008.0, 8.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.665895928861573e-05, 2.276245504617691e-05, 8.218386938096955e-05, 0.00014160529826767743, 0.00020102670532651246, 0.0002604481123853475, 0.00031986954854801297, 0.000379290955606848, 0.00043871236266568303, 0.0004981337697245181, 0.0005575551767833531, 0.000616976642049849, 0.0006763980491086841, 0.0007358194561675191, 0.0007952408632263541, 0.0008546622702851892, 0.0009140836773440242, 0.0009735050844028592, 0.0010329264914616942, 0.0010923478985205293, 0.0011517693055793643, 0.0012111907126381993, 0.0012706122361123562, 0.0013300336431711912, 0.0013894549338147044, 0.0014488763408735394, 0.0015082977479323745, 0.0015677191549912095, 0.0016271405620500445, 0.0016865619691088796, 0.0017459834925830364, 0.0018054048996418715, 0.0018648263067007065, 0.0019242477137595415, 0.0019836691208183765, 0.0020430905278772116, 0.0021025119349360466, 0.0021619333419948816, 0.0022213547490537167, 0.0022807761561125517, 0.0023401975631713867, 0.0023996189702302217, 0.0024590403772890568, 0.002518461784347892, 0.002577883191406727, 0.002637304598465562, 0.002696726005524397, 0.002756147412583232, 0.002815568819642067, 0.002874990226700902, 0.002934411633759737, 0.002993833040818572, 0.003053254447877407, 0.003112675854936242, 0.003172097261995077, 0.003231518669053912, 0.003290940308943391, 0.003350361716002226, 0.003409783123061061, 0.003469204530119896, 0.003528625937178731, 0.003588047344237566, 0.003647468751296401, 0.003706890158355236, 0.003766311565414071]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 8.0, 15.0, 11.0, 22.0, 27.0, 40.0, 53.0, 48.0, 77.0, 82.0, 97.0, 58.0, 94.0, 76.0, 69.0, 56.0, 47.0, 35.0, 30.0, 18.0, 9.0, 12.0, 15.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0001519322395324707, -0.00014598481357097626, -0.0001400373876094818, -0.00013408996164798737, -0.00012814253568649292, -0.00012219510972499847, -0.00011624768376350403, -0.00011030025780200958, -0.00010435283184051514, -9.840540587902069e-05, -9.245797991752625e-05, -8.65105539560318e-05, -8.056312799453735e-05, -7.461570203304291e-05, -6.866827607154846e-05, -6.272085011005402e-05, -5.677342414855957e-05, -5.0825998187065125e-05, -4.487857222557068e-05, -3.893114626407623e-05, -3.298372030258179e-05, -2.703629434108734e-05, -2.1088868379592896e-05, -1.514144241809845e-05, -9.194016456604004e-06, -3.246590495109558e-06, 2.7008354663848877e-06, 8.648261427879333e-06, 1.459568738937378e-05, 2.0543113350868225e-05, 2.649053931236267e-05, 3.243796527385712e-05, 3.838539123535156e-05, 4.433281719684601e-05, 5.0280243158340454e-05, 5.62276691198349e-05, 6.217509508132935e-05, 6.812252104282379e-05, 7.406994700431824e-05, 8.001737296581268e-05, 8.596479892730713e-05, 9.191222488880157e-05, 9.785965085029602e-05, 0.00010380707681179047, 0.00010975450277328491, 0.00011570192873477936, 0.0001216493546962738, 0.00012759678065776825, 0.0001335442066192627, 0.00013949163258075714, 0.0001454390585422516, 0.00015138648450374603, 0.00015733391046524048, 0.00016328133642673492, 0.00016922876238822937, 0.00017517618834972382, 0.00018112361431121826, 0.0001870710402727127, 0.00019301846623420715, 0.0001989658921957016, 0.00020491331815719604, 0.0002108607441186905, 0.00021680817008018494, 0.00022275559604167938, 0.00022870302200317383]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 6.0, 5.0, 7.0, 12.0, 9.0, 7.0, 10.0, 8.0, 9.0, 17.0, 18.0, 25.0, 16.0, 28.0, 30.0, 42.0, 58.0, 62.0, 94.0, 92.0, 99.0, 62.0, 49.0, 31.0, 28.0, 22.0, 20.0, 27.0, 12.0, 20.0, 10.0, 12.0, 8.0, 6.0, 7.0, 8.0, 7.0, 3.0, 3.0, 8.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.984375, -8.666259765625, -8.34814453125, -8.030029296875, -7.7119140625, -7.393798828125, -7.07568359375, -6.757568359375, -6.439453125, -6.121337890625, -5.80322265625, -5.485107421875, -5.1669921875, -4.848876953125, -4.53076171875, -4.212646484375, -3.89453125, -3.576416015625, -3.25830078125, -2.940185546875, -2.6220703125, -2.303955078125, -1.98583984375, -1.667724609375, -1.349609375, -1.031494140625, -0.71337890625, -0.395263671875, -0.0771484375, 0.240966796875, 0.55908203125, 0.877197265625, 1.1953125, 1.513427734375, 1.83154296875, 2.149658203125, 2.4677734375, 2.785888671875, 3.10400390625, 3.422119140625, 3.740234375, 4.058349609375, 4.37646484375, 4.694580078125, 5.0126953125, 5.330810546875, 5.64892578125, 5.967041015625, 6.28515625, 6.603271484375, 6.92138671875, 7.239501953125, 7.5576171875, 7.875732421875, 8.19384765625, 8.511962890625, 8.830078125, 9.148193359375, 9.46630859375, 9.784423828125, 10.1025390625, 10.420654296875, 10.73876953125, 11.056884765625, 11.375]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 6.0, 11.0, 17.0, 15.0, 33.0, 41.0, 53.0, 87.0, 105.0, 157.0, 181.0, 264.0, 365.0, 500.0, 749.0, 1109.0, 1650.0, 2760.0, 4670.0, 8910.0, 20372.0, 65274.0, 728714.0, 152277.0, 31795.0, 12404.0, 6218.0, 3351.0, 2094.0, 1351.0, 917.0, 573.0, 436.0, 290.0, 207.0, 177.0, 110.0, 87.0, 70.0, 42.0, 37.0, 27.0, 16.0, 8.0, 8.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-38.625, -37.36767578125, -36.1103515625, -34.85302734375, -33.595703125, -32.33837890625, -31.0810546875, -29.82373046875, -28.56640625, -27.30908203125, -26.0517578125, -24.79443359375, -23.537109375, -22.27978515625, -21.0224609375, -19.76513671875, -18.5078125, -17.25048828125, -15.9931640625, -14.73583984375, -13.478515625, -12.22119140625, -10.9638671875, -9.70654296875, -8.44921875, -7.19189453125, -5.9345703125, -4.67724609375, -3.419921875, -2.16259765625, -0.9052734375, 0.35205078125, 1.609375, 2.86669921875, 4.1240234375, 5.38134765625, 6.638671875, 7.89599609375, 9.1533203125, 10.41064453125, 11.66796875, 12.92529296875, 14.1826171875, 15.43994140625, 16.697265625, 17.95458984375, 19.2119140625, 20.46923828125, 21.7265625, 22.98388671875, 24.2412109375, 25.49853515625, 26.755859375, 28.01318359375, 29.2705078125, 30.52783203125, 31.78515625, 33.04248046875, 34.2998046875, 35.55712890625, 36.814453125, 38.07177734375, 39.3291015625, 40.58642578125, 41.84375]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 7.0, 8.0, 4.0, 7.0, 7.0, 6.0, 8.0, 9.0, 11.0, 27.0, 24.0, 21.0, 26.0, 20.0, 29.0, 28.0, 36.0, 44.0, 46.0, 44.0, 59.0, 105.0, 281.0, 1538.0, 154.0, 86.0, 57.0, 32.0, 49.0, 31.0, 27.0, 35.0, 31.0, 27.0, 19.0, 21.0, 19.0, 11.0, 12.0, 10.0, 4.0, 5.0, 7.0, 6.0, 8.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.21875, -25.40380859375, -24.5888671875, -23.77392578125, -22.958984375, -22.14404296875, -21.3291015625, -20.51416015625, -19.69921875, -18.88427734375, -18.0693359375, -17.25439453125, -16.439453125, -15.62451171875, -14.8095703125, -13.99462890625, -13.1796875, -12.36474609375, -11.5498046875, -10.73486328125, -9.919921875, -9.10498046875, -8.2900390625, -7.47509765625, -6.66015625, -5.84521484375, -5.0302734375, -4.21533203125, -3.400390625, -2.58544921875, -1.7705078125, -0.95556640625, -0.140625, 0.67431640625, 1.4892578125, 2.30419921875, 3.119140625, 3.93408203125, 4.7490234375, 5.56396484375, 6.37890625, 7.19384765625, 8.0087890625, 8.82373046875, 9.638671875, 10.45361328125, 11.2685546875, 12.08349609375, 12.8984375, 13.71337890625, 14.5283203125, 15.34326171875, 16.158203125, 16.97314453125, 17.7880859375, 18.60302734375, 19.41796875, 20.23291015625, 21.0478515625, 21.86279296875, 22.677734375, 23.49267578125, 24.3076171875, 25.12255859375, 25.9375]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 1.0, 3.0, 5.0, 4.0, 7.0, 11.0, 17.0, 11.0, 13.0, 18.0, 18.0, 22.0, 35.0, 32.0, 45.0, 87.0, 114.0, 203.0, 562.0, 4534.0, 2598080.0, 537207.0, 3519.0, 475.0, 201.0, 118.0, 77.0, 56.0, 33.0, 34.0, 25.0, 23.0, 21.0, 20.0, 16.0, 11.0, 11.0, 9.0, 5.0, 8.0, 5.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-106.6875, -103.0029296875, -99.318359375, -95.6337890625, -91.94921875, -88.2646484375, -84.580078125, -80.8955078125, -77.2109375, -73.5263671875, -69.841796875, -66.1572265625, -62.47265625, -58.7880859375, -55.103515625, -51.4189453125, -47.734375, -44.0498046875, -40.365234375, -36.6806640625, -32.99609375, -29.3115234375, -25.626953125, -21.9423828125, -18.2578125, -14.5732421875, -10.888671875, -7.2041015625, -3.51953125, 0.1650390625, 3.849609375, 7.5341796875, 11.21875, 14.9033203125, 18.587890625, 22.2724609375, 25.95703125, 29.6416015625, 33.326171875, 37.0107421875, 40.6953125, 44.3798828125, 48.064453125, 51.7490234375, 55.43359375, 59.1181640625, 62.802734375, 66.4873046875, 70.171875, 73.8564453125, 77.541015625, 81.2255859375, 84.91015625, 88.5947265625, 92.279296875, 95.9638671875, 99.6484375, 103.3330078125, 107.017578125, 110.7021484375, 114.38671875, 118.0712890625, 121.755859375, 125.4404296875, 129.125]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 42.0, 305.0, 468.0, 138.0, 32.0, 17.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-177.86587524414062, -172.7935791015625, -167.7212677001953, -162.64895629882812, -157.57666015625, -152.50436401367188, -147.4320526123047, -142.3597412109375, -137.28744506835938, -132.21514892578125, -127.14283752441406, -122.0705337524414, -116.99822998046875, -111.9259262084961, -106.85362243652344, -101.78131866455078, -96.70901489257812, -91.63671112060547, -86.56440734863281, -81.49210357666016, -76.4197998046875, -71.34749603271484, -66.27519226074219, -61.20288848876953, -56.130584716796875, -51.05828094482422, -45.98597717285156, -40.913673400878906, -35.84136962890625, -30.769065856933594, -25.696762084960938, -20.62445831298828, -15.552154541015625, -10.479850769042969, -5.4075469970703125, -0.33524322509765625, 4.737060546875, 9.809364318847656, 14.881668090820312, 19.95397186279297, 25.026275634765625, 30.09857940673828, 35.17088317871094, 40.243186950683594, 45.31549072265625, 50.387794494628906, 55.46009826660156, 60.53240203857422, 65.60470581054688, 70.67700958251953, 75.74931335449219, 80.82161712646484, 85.8939208984375, 90.96622467041016, 96.03852844238281, 101.11083221435547, 106.18313598632812, 111.25543975830078, 116.32774353027344, 121.4000473022461, 126.47235107421875, 131.54464721679688, 136.61695861816406, 141.68927001953125, 146.76156616210938]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 12.0, 9.0, 11.0, 12.0, 18.0, 17.0, 28.0, 32.0, 31.0, 37.0, 45.0, 52.0, 49.0, 46.0, 61.0, 54.0, 65.0, 51.0, 52.0, 49.0, 55.0, 35.0, 30.0, 42.0, 28.0, 23.0, 14.0, 17.0, 9.0, 6.0, 3.0, 7.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-118.12557983398438, -114.09078216552734, -110.05598449707031, -106.02118682861328, -101.98638916015625, -97.95159149169922, -93.91679382324219, -89.88199615478516, -85.84719848632812, -81.8124008178711, -77.77760314941406, -73.74280548095703, -69.7080078125, -65.67321014404297, -61.63841247558594, -57.603614807128906, -53.568817138671875, -49.534019470214844, -45.49922180175781, -41.46442413330078, -37.42962646484375, -33.39482879638672, -29.360031127929688, -25.325233459472656, -21.290435791015625, -17.255638122558594, -13.220840454101562, -9.186042785644531, -5.1512451171875, -1.1164474487304688, 2.9183502197265625, 6.953147888183594, 10.987945556640625, 15.022743225097656, 19.057540893554688, 23.09233856201172, 27.12713623046875, 31.16193389892578, 35.19673156738281, 39.231529235839844, 43.266326904296875, 47.301124572753906, 51.33592224121094, 55.37071990966797, 59.405517578125, 63.44031524658203, 67.47511291503906, 71.5099105834961, 75.54470825195312, 79.57950592041016, 83.61430358886719, 87.64910125732422, 91.68389892578125, 95.71869659423828, 99.75349426269531, 103.78829193115234, 107.82308959960938, 111.8578872680664, 115.89268493652344, 119.92748260498047, 123.9622802734375, 127.99707794189453, 132.03187561035156, 136.06668090820312, 140.10147094726562]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 4.0, 5.0, 17.0, 7.0, 12.0, 7.0, 6.0, 11.0, 16.0, 21.0, 18.0, 14.0, 26.0, 35.0, 39.0, 57.0, 76.0, 85.0, 66.0, 83.0, 73.0, 51.0, 43.0, 27.0, 36.0, 22.0, 13.0, 23.0, 17.0, 15.0, 7.0, 10.0, 7.0, 9.0, 8.0, 4.0, 7.0, 7.0, 6.0, 1.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.7265625, -8.409912109375, -8.09326171875, -7.776611328125, -7.4599609375, -7.143310546875, -6.82666015625, -6.510009765625, -6.193359375, -5.876708984375, -5.56005859375, -5.243408203125, -4.9267578125, -4.610107421875, -4.29345703125, -3.976806640625, -3.66015625, -3.343505859375, -3.02685546875, -2.710205078125, -2.3935546875, -2.076904296875, -1.76025390625, -1.443603515625, -1.126953125, -0.810302734375, -0.49365234375, -0.177001953125, 0.1396484375, 0.456298828125, 0.77294921875, 1.089599609375, 1.40625, 1.722900390625, 2.03955078125, 2.356201171875, 2.6728515625, 2.989501953125, 3.30615234375, 3.622802734375, 3.939453125, 4.256103515625, 4.57275390625, 4.889404296875, 5.2060546875, 5.522705078125, 5.83935546875, 6.156005859375, 6.47265625, 6.789306640625, 7.10595703125, 7.422607421875, 7.7392578125, 8.055908203125, 8.37255859375, 8.689208984375, 9.005859375, 9.322509765625, 9.63916015625, 9.955810546875, 10.2724609375, 10.589111328125, 10.90576171875, 11.222412109375, 11.5390625]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 8.0, 7.0, 14.0, 9.0, 9.0, 22.0, 13.0, 22.0, 46.0, 44.0, 88.0, 110.0, 220.0, 316.0, 607.0, 1356.0, 3679.0, 17056.0, 3957117.0, 201234.0, 7942.0, 2257.0, 905.0, 415.0, 273.0, 170.0, 103.0, 50.0, 51.0, 25.0, 27.0, 20.0, 10.0, 9.0, 13.0, 7.0, 5.0, 7.0, 5.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.5625, -76.6982421875, -73.833984375, -70.9697265625, -68.10546875, -65.2412109375, -62.376953125, -59.5126953125, -56.6484375, -53.7841796875, -50.919921875, -48.0556640625, -45.19140625, -42.3271484375, -39.462890625, -36.5986328125, -33.734375, -30.8701171875, -28.005859375, -25.1416015625, -22.27734375, -19.4130859375, -16.548828125, -13.6845703125, -10.8203125, -7.9560546875, -5.091796875, -2.2275390625, 0.63671875, 3.5009765625, 6.365234375, 9.2294921875, 12.09375, 14.9580078125, 17.822265625, 20.6865234375, 23.55078125, 26.4150390625, 29.279296875, 32.1435546875, 35.0078125, 37.8720703125, 40.736328125, 43.6005859375, 46.46484375, 49.3291015625, 52.193359375, 55.0576171875, 57.921875, 60.7861328125, 63.650390625, 66.5146484375, 69.37890625, 72.2431640625, 75.107421875, 77.9716796875, 80.8359375, 83.7001953125, 86.564453125, 89.4287109375, 92.29296875, 95.1572265625, 98.021484375, 100.8857421875, 103.75]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 4.0, 5.0, 4.0, 8.0, 2.0, 5.0, 6.0, 11.0, 9.0, 9.0, 13.0, 17.0, 33.0, 25.0, 38.0, 74.0, 125.0, 283.0, 601.0, 1021.0, 816.0, 403.0, 200.0, 95.0, 58.0, 41.0, 35.0, 20.0, 19.0, 16.0, 13.0, 11.0, 9.0, 8.0, 3.0, 4.0, 6.0, 8.0, 3.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.4375, -28.537353515625, -27.63720703125, -26.737060546875, -25.8369140625, -24.936767578125, -24.03662109375, -23.136474609375, -22.236328125, -21.336181640625, -20.43603515625, -19.535888671875, -18.6357421875, -17.735595703125, -16.83544921875, -15.935302734375, -15.03515625, -14.135009765625, -13.23486328125, -12.334716796875, -11.4345703125, -10.534423828125, -9.63427734375, -8.734130859375, -7.833984375, -6.933837890625, -6.03369140625, -5.133544921875, -4.2333984375, -3.333251953125, -2.43310546875, -1.532958984375, -0.6328125, 0.267333984375, 1.16748046875, 2.067626953125, 2.9677734375, 3.867919921875, 4.76806640625, 5.668212890625, 6.568359375, 7.468505859375, 8.36865234375, 9.268798828125, 10.1689453125, 11.069091796875, 11.96923828125, 12.869384765625, 13.76953125, 14.669677734375, 15.56982421875, 16.469970703125, 17.3701171875, 18.270263671875, 19.17041015625, 20.070556640625, 20.970703125, 21.870849609375, 22.77099609375, 23.671142578125, 24.5712890625, 25.471435546875, 26.37158203125, 27.271728515625, 28.171875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 8.0, 10.0, 6.0, 6.0, 11.0, 18.0, 21.0, 47.0, 46.0, 88.0, 136.0, 243.0, 485.0, 1025.0, 2727.0, 8026.0, 27596.0, 244579.0, 3791552.0, 91075.0, 17483.0, 5495.0, 1907.0, 751.0, 365.0, 199.0, 117.0, 69.0, 56.0, 34.0, 23.0, 18.0, 8.0, 7.0, 7.0, 7.0, 10.0, 3.0, 5.0, 1.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-62.75, -60.86767578125, -58.9853515625, -57.10302734375, -55.220703125, -53.33837890625, -51.4560546875, -49.57373046875, -47.69140625, -45.80908203125, -43.9267578125, -42.04443359375, -40.162109375, -38.27978515625, -36.3974609375, -34.51513671875, -32.6328125, -30.75048828125, -28.8681640625, -26.98583984375, -25.103515625, -23.22119140625, -21.3388671875, -19.45654296875, -17.57421875, -15.69189453125, -13.8095703125, -11.92724609375, -10.044921875, -8.16259765625, -6.2802734375, -4.39794921875, -2.515625, -0.63330078125, 1.2490234375, 3.13134765625, 5.013671875, 6.89599609375, 8.7783203125, 10.66064453125, 12.54296875, 14.42529296875, 16.3076171875, 18.18994140625, 20.072265625, 21.95458984375, 23.8369140625, 25.71923828125, 27.6015625, 29.48388671875, 31.3662109375, 33.24853515625, 35.130859375, 37.01318359375, 38.8955078125, 40.77783203125, 42.66015625, 44.54248046875, 46.4248046875, 48.30712890625, 50.189453125, 52.07177734375, 53.9541015625, 55.83642578125, 57.71875]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 12.0, 41.0, 203.0, 579.0, 122.0, 37.0, 11.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-296.17376708984375, -286.0932312011719, -276.0126953125, -265.93212890625, -255.85159301757812, -245.77105712890625, -235.6905059814453, -225.60995483398438, -215.5294189453125, -205.44888305664062, -195.3683319091797, -185.28778076171875, -175.20724487304688, -165.126708984375, -155.04615783691406, -144.96560668945312, -134.88507080078125, -124.80452728271484, -114.72398376464844, -104.64344024658203, -94.56289672851562, -84.48235321044922, -74.40180969238281, -64.3212661743164, -54.24072265625, -44.160179138183594, -34.07963562011719, -23.99909210205078, -13.918548583984375, -3.8380050659179688, 6.2425384521484375, 16.323081970214844, 26.403656005859375, 36.48419952392578, 46.56474304199219, 56.645286560058594, 66.725830078125, 76.8063735961914, 86.88691711425781, 96.96746063232422, 107.04800415039062, 117.12854766845703, 127.20909118652344, 137.28964233398438, 147.37017822265625, 157.45071411132812, 167.53126525878906, 177.61181640625, 187.69235229492188, 197.77288818359375, 207.8534393310547, 217.93399047851562, 228.0145263671875, 238.09506225585938, 248.1756134033203, 258.25616455078125, 268.3367004394531, 278.417236328125, 288.497802734375, 298.5783386230469, 308.65887451171875, 318.7394104003906, 328.8199462890625, 338.9005126953125, 348.9810485839844]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 3.0, 7.0, 10.0, 12.0, 11.0, 13.0, 16.0, 12.0, 19.0, 16.0, 24.0, 23.0, 26.0, 30.0, 39.0, 38.0, 41.0, 50.0, 48.0, 44.0, 44.0, 48.0, 40.0, 35.0, 38.0, 42.0, 41.0, 34.0, 23.0, 16.0, 20.0, 18.0, 20.0, 19.0, 23.0, 8.0, 10.0, 13.0, 8.0, 3.0, 5.0, 6.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-89.58663940429688, -86.78866577148438, -83.99069213867188, -81.19271850585938, -78.39474487304688, -75.59677124023438, -72.79879760742188, -70.00081634521484, -67.20284271240234, -64.40486907958984, -61.606895446777344, -58.808921813964844, -56.01094436645508, -53.21297073364258, -50.41499710083008, -47.61701965332031, -44.81904983520508, -42.02107620239258, -39.22310256958008, -36.42512512207031, -33.62715148925781, -30.829177856445312, -28.031204223632812, -25.23322868347168, -22.43525505065918, -19.63728141784668, -16.839305877685547, -14.041332244873047, -11.24335765838623, -8.445383071899414, -5.647409439086914, -2.8494338989257812, -0.05146026611328125, 2.746514081954956, 5.544488430023193, 8.342462539672852, 11.140437126159668, 13.938411712646484, 16.736385345458984, 19.534360885620117, 22.332334518432617, 25.130308151245117, 27.92828369140625, 30.72625732421875, 33.52423095703125, 36.32220458984375, 39.12017822265625, 41.918155670166016, 44.716129302978516, 47.514102935791016, 50.312076568603516, 53.11005401611328, 55.90802764892578, 58.70600128173828, 61.50397491455078, 64.30194854736328, 67.09992218017578, 69.89789581298828, 72.69586944580078, 75.49384307861328, 78.29181671142578, 81.08979797363281, 83.88777160644531, 86.68574523925781, 89.48371887207031]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 0.0, 6.0, 2.0, 1.0, 8.0, 5.0, 7.0, 8.0, 8.0, 13.0, 5.0, 5.0, 18.0, 5.0, 20.0, 21.0, 18.0, 27.0, 26.0, 34.0, 51.0, 63.0, 62.0, 66.0, 69.0, 75.0, 59.0, 59.0, 39.0, 28.0, 30.0, 25.0, 20.0, 22.0, 19.0, 16.0, 11.0, 7.0, 10.0, 5.0, 4.0, 7.0, 8.0, 10.0, 2.0, 2.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.25, -7.95947265625, -7.6689453125, -7.37841796875, -7.087890625, -6.79736328125, -6.5068359375, -6.21630859375, -5.92578125, -5.63525390625, -5.3447265625, -5.05419921875, -4.763671875, -4.47314453125, -4.1826171875, -3.89208984375, -3.6015625, -3.31103515625, -3.0205078125, -2.72998046875, -2.439453125, -2.14892578125, -1.8583984375, -1.56787109375, -1.27734375, -0.98681640625, -0.6962890625, -0.40576171875, -0.115234375, 0.17529296875, 0.4658203125, 0.75634765625, 1.046875, 1.33740234375, 1.6279296875, 1.91845703125, 2.208984375, 2.49951171875, 2.7900390625, 3.08056640625, 3.37109375, 3.66162109375, 3.9521484375, 4.24267578125, 4.533203125, 4.82373046875, 5.1142578125, 5.40478515625, 5.6953125, 5.98583984375, 6.2763671875, 6.56689453125, 6.857421875, 7.14794921875, 7.4384765625, 7.72900390625, 8.01953125, 8.31005859375, 8.6005859375, 8.89111328125, 9.181640625, 9.47216796875, 9.7626953125, 10.05322265625, 10.34375]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 7.0, 7.0, 9.0, 13.0, 22.0, 30.0, 36.0, 85.0, 112.0, 156.0, 267.0, 395.0, 610.0, 876.0, 1339.0, 2044.0, 3128.0, 4862.0, 7496.0, 11716.0, 19894.0, 34611.0, 64622.0, 130183.0, 278723.0, 240410.0, 111806.0, 56263.0, 30677.0, 17713.0, 10845.0, 6669.0, 4486.0, 2906.0, 1884.0, 1254.0, 816.0, 544.0, 344.0, 235.0, 179.0, 109.0, 58.0, 40.0, 33.0, 18.0, 9.0, 8.0, 8.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.18359375, -0.17801284790039062, -0.17243194580078125, -0.16685104370117188, -0.1612701416015625, -0.15568923950195312, -0.15010833740234375, -0.14452743530273438, -0.138946533203125, -0.13336563110351562, -0.12778472900390625, -0.12220382690429688, -0.1166229248046875, -0.11104202270507812, -0.10546112060546875, -0.09988021850585938, -0.09429931640625, -0.08871841430664062, -0.08313751220703125, -0.07755661010742188, -0.0719757080078125, -0.06639480590820312, -0.06081390380859375, -0.055233001708984375, -0.049652099609375, -0.044071197509765625, -0.03849029541015625, -0.032909393310546875, -0.0273284912109375, -0.021747589111328125, -0.01616668701171875, -0.010585784912109375, -0.0050048828125, 0.000576019287109375, 0.00615692138671875, 0.011737823486328125, 0.0173187255859375, 0.022899627685546875, 0.02848052978515625, 0.034061431884765625, 0.039642333984375, 0.045223236083984375, 0.05080413818359375, 0.056385040283203125, 0.0619659423828125, 0.06754684448242188, 0.07312774658203125, 0.07870864868164062, 0.08428955078125, 0.08987045288085938, 0.09545135498046875, 0.10103225708007812, 0.1066131591796875, 0.11219406127929688, 0.11777496337890625, 0.12335586547851562, 0.128936767578125, 0.13451766967773438, 0.14009857177734375, 0.14567947387695312, 0.1512603759765625, 0.15684127807617188, 0.16242218017578125, 0.16800308227539062, 0.173583984375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 5.0, 5.0, 8.0, 8.0, 11.0, 21.0, 13.0, 19.0, 21.0, 38.0, 25.0, 32.0, 28.0, 42.0, 39.0, 35.0, 30.0, 48.0, 52.0, 1068.0, 47.0, 41.0, 38.0, 43.0, 33.0, 32.0, 36.0, 30.0, 28.0, 30.0, 22.0, 20.0, 13.0, 20.0, 11.0, 7.0, 12.0, 7.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.17578125, -4.043212890625, -3.91064453125, -3.778076171875, -3.6455078125, -3.512939453125, -3.38037109375, -3.247802734375, -3.115234375, -2.982666015625, -2.85009765625, -2.717529296875, -2.5849609375, -2.452392578125, -2.31982421875, -2.187255859375, -2.0546875, -1.922119140625, -1.78955078125, -1.656982421875, -1.5244140625, -1.391845703125, -1.25927734375, -1.126708984375, -0.994140625, -0.861572265625, -0.72900390625, -0.596435546875, -0.4638671875, -0.331298828125, -0.19873046875, -0.066162109375, 0.06640625, 0.198974609375, 0.33154296875, 0.464111328125, 0.5966796875, 0.729248046875, 0.86181640625, 0.994384765625, 1.126953125, 1.259521484375, 1.39208984375, 1.524658203125, 1.6572265625, 1.789794921875, 1.92236328125, 2.054931640625, 2.1875, 2.320068359375, 2.45263671875, 2.585205078125, 2.7177734375, 2.850341796875, 2.98291015625, 3.115478515625, 3.248046875, 3.380615234375, 3.51318359375, 3.645751953125, 3.7783203125, 3.910888671875, 4.04345703125, 4.176025390625, 4.30859375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 4.0, 7.0, 3.0, 9.0, 10.0, 16.0, 32.0, 42.0, 55.0, 97.0, 124.0, 172.0, 258.0, 349.0, 519.0, 743.0, 1168.0, 1601.0, 2336.0, 3505.0, 4964.0, 7378.0, 10645.0, 15421.0, 23526.0, 34072.0, 49646.0, 73216.0, 112082.0, 177446.0, 1219606.0, 117368.0, 77149.0, 51968.0, 35445.0, 24223.0, 16378.0, 11198.0, 7675.0, 5247.0, 3501.0, 2421.0, 1684.0, 1191.0, 876.0, 524.0, 400.0, 262.0, 193.0, 109.0, 88.0, 78.0, 51.0, 24.0, 9.0, 10.0, 11.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0], "bins": [-0.0557861328125, -0.05398988723754883, -0.052193641662597656, -0.050397396087646484, -0.04860115051269531, -0.04680490493774414, -0.04500865936279297, -0.0432124137878418, -0.041416168212890625, -0.03961992263793945, -0.03782367706298828, -0.03602743148803711, -0.03423118591308594, -0.032434940338134766, -0.030638694763183594, -0.028842449188232422, -0.02704620361328125, -0.025249958038330078, -0.023453712463378906, -0.021657466888427734, -0.019861221313476562, -0.01806497573852539, -0.01626873016357422, -0.014472484588623047, -0.012676239013671875, -0.010879993438720703, -0.009083747863769531, -0.007287502288818359, -0.0054912567138671875, -0.0036950111389160156, -0.0018987655639648438, -0.00010251998901367188, 0.0016937255859375, 0.003489971160888672, 0.005286216735839844, 0.007082462310791016, 0.008878707885742188, 0.01067495346069336, 0.012471199035644531, 0.014267444610595703, 0.016063690185546875, 0.017859935760498047, 0.01965618133544922, 0.02145242691040039, 0.023248672485351562, 0.025044918060302734, 0.026841163635253906, 0.028637409210205078, 0.03043365478515625, 0.03222990036010742, 0.034026145935058594, 0.035822391510009766, 0.03761863708496094, 0.03941488265991211, 0.04121112823486328, 0.04300737380981445, 0.044803619384765625, 0.0465998649597168, 0.04839611053466797, 0.05019235610961914, 0.05198860168457031, 0.053784847259521484, 0.055581092834472656, 0.05737733840942383, 0.059173583984375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 6.0, 6.0, 5.0, 17.0, 19.0, 26.0, 25.0, 34.0, 35.0, 57.0, 57.0, 85.0, 67.0, 80.0, 72.0, 61.0, 63.0, 66.0, 59.0, 38.0, 30.0, 15.0, 15.0, 13.0, 9.0, 8.0, 6.0, 3.0, 8.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001628398895263672, -0.00015756674110889435, -0.0001522935926914215, -0.00014702044427394867, -0.00014174729585647583, -0.000136474147439003, -0.00013120099902153015, -0.0001259278506040573, -0.00012065470218658447, -0.00011538155376911163, -0.0001101084053516388, -0.00010483525693416595, -9.956210851669312e-05, -9.428896009922028e-05, -8.901581168174744e-05, -8.37426632642746e-05, -7.846951484680176e-05, -7.319636642932892e-05, -6.792321801185608e-05, -6.265006959438324e-05, -5.73769211769104e-05, -5.210377275943756e-05, -4.683062434196472e-05, -4.155747592449188e-05, -3.628432750701904e-05, -3.1011179089546204e-05, -2.5738030672073364e-05, -2.0464882254600525e-05, -1.5191733837127686e-05, -9.918585419654846e-06, -4.645437002182007e-06, 6.277114152908325e-07, 5.900859832763672e-06, 1.1174008250236511e-05, 1.644715666770935e-05, 2.172030508518219e-05, 2.699345350265503e-05, 3.226660192012787e-05, 3.753975033760071e-05, 4.281289875507355e-05, 4.808604717254639e-05, 5.3359195590019226e-05, 5.8632344007492065e-05, 6.39054924249649e-05, 6.917864084243774e-05, 7.445178925991058e-05, 7.972493767738342e-05, 8.499808609485626e-05, 9.02712345123291e-05, 9.554438292980194e-05, 0.00010081753134727478, 0.00010609067976474762, 0.00011136382818222046, 0.0001166369765996933, 0.00012191012501716614, 0.00012718327343463898, 0.00013245642185211182, 0.00013772957026958466, 0.0001430027186870575, 0.00014827586710453033, 0.00015354901552200317, 0.000158822163939476, 0.00016409531235694885, 0.0001693684607744217, 0.00017464160919189453]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 1.0, 3.0, 4.0, 4.0, 3.0, 14.0, 12.0, 10.0, 18.0, 20.0, 22.0, 42.0, 56.0, 70.0, 80.0, 94.0, 149.0, 227.0, 283.0, 490.0, 4432.0, 1033649.0, 7239.0, 528.0, 272.0, 221.0, 157.0, 140.0, 65.0, 49.0, 53.0, 28.0, 31.0, 18.0, 16.0, 15.0, 9.0, 10.0, 6.0, 6.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0027408599853515625, -0.002651125192642212, -0.0025613903999328613, -0.0024716556072235107, -0.00238192081451416, -0.0022921860218048096, -0.002202451229095459, -0.0021127164363861084, -0.002022981643676758, -0.0019332468509674072, -0.0018435120582580566, -0.001753777265548706, -0.0016640424728393555, -0.0015743076801300049, -0.0014845728874206543, -0.0013948380947113037, -0.0013051033020019531, -0.0012153685092926025, -0.001125633716583252, -0.0010358989238739014, -0.0009461641311645508, -0.0008564293384552002, -0.0007666945457458496, -0.000676959753036499, -0.0005872249603271484, -0.0004974901676177979, -0.00040775537490844727, -0.0003180205821990967, -0.0002282857894897461, -0.0001385509967803955, -4.881620407104492e-05, 4.0918588638305664e-05, 0.00013065338134765625, 0.00022038817405700684, 0.0003101229667663574, 0.000399857759475708, 0.0004895925521850586, 0.0005793273448944092, 0.0006690621376037598, 0.0007587969303131104, 0.0008485317230224609, 0.0009382665157318115, 0.0010280013084411621, 0.0011177361011505127, 0.0012074708938598633, 0.0012972056865692139, 0.0013869404792785645, 0.001476675271987915, 0.0015664100646972656, 0.0016561448574066162, 0.0017458796501159668, 0.0018356144428253174, 0.001925349235534668, 0.0020150840282440186, 0.002104818820953369, 0.0021945536136627197, 0.0022842884063720703, 0.002374023199081421, 0.0024637579917907715, 0.002553492784500122, 0.0026432275772094727, 0.0027329623699188232, 0.002822697162628174, 0.0029124319553375244, 0.003002166748046875]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [75.0, 925.0, 16.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.584178921300918e-05, -8.314827937283553e-06, 1.9212133338442072e-05, 4.6739092795178294e-05, 7.426605588989332e-05, 0.00010179301898460835, 0.00012931997480336577, 0.0001568469451740384, 0.00018437390099279583, 0.00021190085681155324, 0.00023942782718222588, 0.00026695476844906807, 0.00029448175337165594, 0.00032200870919041336, 0.00034953566500917077, 0.00037706264993175864, 0.0004045895766466856, 0.000432116532465443, 0.00045964348828420043, 0.0004871704732067883, 0.0005146973999217153, 0.0005422243848443031, 0.000569751369766891, 0.000597278296481818, 0.0006248052814044058, 0.0006523322663269937, 0.0006798591930419207, 0.0007073861779645085, 0.0007349131046794355, 0.0007624400896020234, 0.0007899670163169503, 0.0008174940012395382, 0.0008450209279544652, 0.000872547912877053, 0.00090007483959198, 0.0009276018245145679, 0.0009551287512294948, 0.0009826556779444218, 0.0010101826628670096, 0.0010377096477895975, 0.0010652366327121854, 0.0010927636176347733, 0.0011202906025573611, 0.0011478174710646272, 0.001175344455987215, 0.001202871440909803, 0.0012303984258323908, 0.0012579254107549787, 0.0012854522792622447, 0.0013129792641848326, 0.0013405062491074204, 0.0013680331176146865, 0.0013955601025372744, 0.0014230870874598622, 0.00145061407238245, 0.001478141057305038, 0.0015056680422276258, 0.0015331950271502137, 0.0015607220120728016, 0.0015882488805800676, 0.0016157758655026555, 0.0016433028504252434, 0.0016708298353478312, 0.0016983568202704191, 0.0017258836887776852]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 12.0, 11.0, 10.0, 11.0, 18.0, 25.0, 18.0, 35.0, 35.0, 41.0, 62.0, 44.0, 34.0, 37.0, 43.0, 53.0, 45.0, 52.0, 46.0, 48.0, 60.0, 42.0, 26.0, 47.0, 33.0, 19.0, 14.0, 13.0, 13.0, 13.0, 8.0, 7.0, 6.0, 5.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.495019912719727e-05, -9.189825505018234e-05, -8.884631097316742e-05, -8.57943668961525e-05, -8.274242281913757e-05, -7.969047874212265e-05, -7.663853466510773e-05, -7.35865905880928e-05, -7.053464651107788e-05, -6.748270243406296e-05, -6.443075835704803e-05, -6.137881428003311e-05, -5.832687020301819e-05, -5.5274926126003265e-05, -5.222298204898834e-05, -4.917103797197342e-05, -4.6119093894958496e-05, -4.306714981794357e-05, -4.001520574092865e-05, -3.696326166391373e-05, -3.3911317586898804e-05, -3.085937350988388e-05, -2.7807429432868958e-05, -2.4755485355854034e-05, -2.170354127883911e-05, -1.8651597201824188e-05, -1.5599653124809265e-05, -1.2547709047794342e-05, -9.495764970779419e-06, -6.443820893764496e-06, -3.3918768167495728e-06, -3.3993273973464966e-07, 2.7120113372802734e-06, 5.7639554142951965e-06, 8.81589949131012e-06, 1.1867843568325043e-05, 1.4919787645339966e-05, 1.797173172235489e-05, 2.1023675799369812e-05, 2.4075619876384735e-05, 2.7127563953399658e-05, 3.017950803041458e-05, 3.3231452107429504e-05, 3.628339618444443e-05, 3.933534026145935e-05, 4.2387284338474274e-05, 4.54392284154892e-05, 4.849117249250412e-05, 5.154311656951904e-05, 5.4595060646533966e-05, 5.764700472354889e-05, 6.069894880056381e-05, 6.375089287757874e-05, 6.680283695459366e-05, 6.985478103160858e-05, 7.29067251086235e-05, 7.595866918563843e-05, 7.901061326265335e-05, 8.206255733966827e-05, 8.51145014166832e-05, 8.816644549369812e-05, 9.121838957071304e-05, 9.427033364772797e-05, 9.732227772474289e-05, 0.00010037422180175781]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 0.0, 6.0, 2.0, 1.0, 8.0, 5.0, 7.0, 8.0, 8.0, 13.0, 5.0, 5.0, 18.0, 5.0, 20.0, 21.0, 18.0, 27.0, 26.0, 34.0, 51.0, 63.0, 62.0, 66.0, 69.0, 75.0, 59.0, 59.0, 39.0, 28.0, 30.0, 25.0, 20.0, 22.0, 19.0, 16.0, 11.0, 7.0, 10.0, 5.0, 4.0, 7.0, 8.0, 10.0, 2.0, 2.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.25, -7.95947265625, -7.6689453125, -7.37841796875, -7.087890625, -6.79736328125, -6.5068359375, -6.21630859375, -5.92578125, -5.63525390625, -5.3447265625, -5.05419921875, -4.763671875, -4.47314453125, -4.1826171875, -3.89208984375, -3.6015625, -3.31103515625, -3.0205078125, -2.72998046875, -2.439453125, -2.14892578125, -1.8583984375, -1.56787109375, -1.27734375, -0.98681640625, -0.6962890625, -0.40576171875, -0.115234375, 0.17529296875, 0.4658203125, 0.75634765625, 1.046875, 1.33740234375, 1.6279296875, 1.91845703125, 2.208984375, 2.49951171875, 2.7900390625, 3.08056640625, 3.37109375, 3.66162109375, 3.9521484375, 4.24267578125, 4.533203125, 4.82373046875, 5.1142578125, 5.40478515625, 5.6953125, 5.98583984375, 6.2763671875, 6.56689453125, 6.857421875, 7.14794921875, 7.4384765625, 7.72900390625, 8.01953125, 8.31005859375, 8.6005859375, 8.89111328125, 9.181640625, 9.47216796875, 9.7626953125, 10.05322265625, 10.34375]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 6.0, 6.0, 6.0, 19.0, 14.0, 27.0, 38.0, 42.0, 67.0, 85.0, 94.0, 139.0, 198.0, 270.0, 379.0, 508.0, 726.0, 1032.0, 1499.0, 2386.0, 3828.0, 7613.0, 20219.0, 111530.0, 801116.0, 64904.0, 15314.0, 6268.0, 3444.0, 2097.0, 1254.0, 973.0, 672.0, 498.0, 362.0, 242.0, 175.0, 128.0, 99.0, 87.0, 56.0, 52.0, 26.0, 29.0, 18.0, 8.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-18.515625, -17.925537109375, -17.33544921875, -16.745361328125, -16.1552734375, -15.565185546875, -14.97509765625, -14.385009765625, -13.794921875, -13.204833984375, -12.61474609375, -12.024658203125, -11.4345703125, -10.844482421875, -10.25439453125, -9.664306640625, -9.07421875, -8.484130859375, -7.89404296875, -7.303955078125, -6.7138671875, -6.123779296875, -5.53369140625, -4.943603515625, -4.353515625, -3.763427734375, -3.17333984375, -2.583251953125, -1.9931640625, -1.403076171875, -0.81298828125, -0.222900390625, 0.3671875, 0.957275390625, 1.54736328125, 2.137451171875, 2.7275390625, 3.317626953125, 3.90771484375, 4.497802734375, 5.087890625, 5.677978515625, 6.26806640625, 6.858154296875, 7.4482421875, 8.038330078125, 8.62841796875, 9.218505859375, 9.80859375, 10.398681640625, 10.98876953125, 11.578857421875, 12.1689453125, 12.759033203125, 13.34912109375, 13.939208984375, 14.529296875, 15.119384765625, 15.70947265625, 16.299560546875, 16.8896484375, 17.479736328125, 18.06982421875, 18.659912109375, 19.25]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 3.0, 1.0, 5.0, 2.0, 7.0, 11.0, 17.0, 11.0, 11.0, 16.0, 18.0, 12.0, 20.0, 31.0, 33.0, 36.0, 32.0, 37.0, 49.0, 38.0, 56.0, 80.0, 417.0, 1563.0, 79.0, 59.0, 34.0, 37.0, 45.0, 42.0, 35.0, 39.0, 17.0, 21.0, 25.0, 24.0, 12.0, 15.0, 11.0, 15.0, 4.0, 6.0, 7.0, 9.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.375, -31.42431640625, -30.4736328125, -29.52294921875, -28.572265625, -27.62158203125, -26.6708984375, -25.72021484375, -24.76953125, -23.81884765625, -22.8681640625, -21.91748046875, -20.966796875, -20.01611328125, -19.0654296875, -18.11474609375, -17.1640625, -16.21337890625, -15.2626953125, -14.31201171875, -13.361328125, -12.41064453125, -11.4599609375, -10.50927734375, -9.55859375, -8.60791015625, -7.6572265625, -6.70654296875, -5.755859375, -4.80517578125, -3.8544921875, -2.90380859375, -1.953125, -1.00244140625, -0.0517578125, 0.89892578125, 1.849609375, 2.80029296875, 3.7509765625, 4.70166015625, 5.65234375, 6.60302734375, 7.5537109375, 8.50439453125, 9.455078125, 10.40576171875, 11.3564453125, 12.30712890625, 13.2578125, 14.20849609375, 15.1591796875, 16.10986328125, 17.060546875, 18.01123046875, 18.9619140625, 19.91259765625, 20.86328125, 21.81396484375, 22.7646484375, 23.71533203125, 24.666015625, 25.61669921875, 26.5673828125, 27.51806640625, 28.46875]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 5.0, 3.0, 10.0, 2.0, 4.0, 6.0, 9.0, 4.0, 13.0, 14.0, 19.0, 26.0, 29.0, 26.0, 35.0, 72.0, 90.0, 116.0, 206.0, 415.0, 833.0, 2446.0, 10272.0, 106567.0, 2984270.0, 31730.0, 5473.0, 1561.0, 592.0, 287.0, 168.0, 106.0, 69.0, 50.0, 41.0, 23.0, 21.0, 13.0, 22.0, 12.0, 11.0, 12.0, 10.0, 6.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-51.15625, -49.28173828125, -47.4072265625, -45.53271484375, -43.658203125, -41.78369140625, -39.9091796875, -38.03466796875, -36.16015625, -34.28564453125, -32.4111328125, -30.53662109375, -28.662109375, -26.78759765625, -24.9130859375, -23.03857421875, -21.1640625, -19.28955078125, -17.4150390625, -15.54052734375, -13.666015625, -11.79150390625, -9.9169921875, -8.04248046875, -6.16796875, -4.29345703125, -2.4189453125, -0.54443359375, 1.330078125, 3.20458984375, 5.0791015625, 6.95361328125, 8.828125, 10.70263671875, 12.5771484375, 14.45166015625, 16.326171875, 18.20068359375, 20.0751953125, 21.94970703125, 23.82421875, 25.69873046875, 27.5732421875, 29.44775390625, 31.322265625, 33.19677734375, 35.0712890625, 36.94580078125, 38.8203125, 40.69482421875, 42.5693359375, 44.44384765625, 46.318359375, 48.19287109375, 50.0673828125, 51.94189453125, 53.81640625, 55.69091796875, 57.5654296875, 59.43994140625, 61.314453125, 63.18896484375, 65.0634765625, 66.93798828125, 68.8125]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [2.0, 961.0, 57.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.7734260559082, -24.038291931152344, 7.696842193603516, 39.43197250366211, 71.1671142578125, 102.90225219726562, 134.6373748779297, 166.3725128173828, 198.10765075683594, 229.84278869628906, 261.5779113769531, 293.31304931640625, 325.0481872558594, 356.7833251953125, 388.5184326171875, 420.25360107421875, 451.98870849609375, 483.7238464355469, 515.458984375, 547.194091796875, 578.9292602539062, 610.6643676757812, 642.3995361328125, 674.1346435546875, 705.8698120117188, 737.6049194335938, 769.340087890625, 801.0751953125, 832.8103637695312, 864.5454711914062, 896.2806396484375, 928.0157470703125, 959.7508544921875, 991.4859619140625, 1023.2211303710938, 1054.956298828125, 1086.69140625, 1118.426513671875, 1150.16162109375, 1181.896728515625, 1213.6319580078125, 1245.3670654296875, 1277.1021728515625, 1308.83740234375, 1340.572509765625, 1372.3076171875, 1404.042724609375, 1435.77783203125, 1467.512939453125, 1499.248046875, 1530.983154296875, 1562.7183837890625, 1594.4534912109375, 1626.1885986328125, 1657.9237060546875, 1689.658935546875, 1721.39404296875, 1753.129150390625, 1784.8642578125, 1816.5994873046875, 1848.3345947265625, 1880.0697021484375, 1911.8048095703125, 1943.5400390625, 1975.275146484375]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 9.0, 6.0, 8.0, 11.0, 12.0, 17.0, 19.0, 16.0, 18.0, 12.0, 24.0, 25.0, 37.0, 34.0, 49.0, 33.0, 49.0, 37.0, 29.0, 36.0, 36.0, 37.0, 43.0, 49.0, 36.0, 40.0, 42.0, 38.0, 34.0, 26.0, 19.0, 17.0, 19.0, 11.0, 14.0, 7.0, 13.0, 8.0, 6.0, 8.0, 5.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-93.44548034667969, -90.22933959960938, -87.01319885253906, -83.79705810546875, -80.5809097290039, -77.3647689819336, -74.14862823486328, -70.93248748779297, -67.71634674072266, -64.50020599365234, -61.284061431884766, -58.06792068481445, -54.85177993774414, -51.63563537597656, -48.41949462890625, -45.20335388183594, -41.98720932006836, -38.77106857299805, -35.55492401123047, -32.338783264160156, -29.122642517089844, -25.9064998626709, -22.690357208251953, -19.47421646118164, -16.258073806762695, -13.041932106018066, -9.825790405273438, -6.609647750854492, -3.3935060501098633, -0.17736434936523438, 3.038778305053711, 6.254919052124023, 9.471061706542969, 12.687203407287598, 15.903345108032227, 19.119487762451172, 22.335628509521484, 25.55177116394043, 28.767913818359375, 31.984054565429688, 35.2001953125, 38.41633605957031, 41.63248062133789, 44.8486213684082, 48.064762115478516, 51.280906677246094, 54.497047424316406, 57.71318817138672, 60.9293327331543, 64.14547729492188, 67.36161804199219, 70.5777587890625, 73.79389953613281, 77.01004028320312, 80.22618103027344, 83.44232177734375, 86.6584701538086, 89.8746109008789, 93.09075164794922, 96.30690002441406, 99.52304077148438, 102.73918151855469, 105.955322265625, 109.17146301269531, 112.38760375976562]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 2.0, 5.0, 6.0, 10.0, 9.0, 11.0, 6.0, 9.0, 11.0, 12.0, 16.0, 13.0, 18.0, 30.0, 30.0, 31.0, 42.0, 51.0, 71.0, 44.0, 82.0, 66.0, 66.0, 55.0, 54.0, 33.0, 29.0, 26.0, 26.0, 19.0, 21.0, 20.0, 8.0, 12.0, 5.0, 7.0, 6.0, 6.0, 6.0, 8.0, 7.0, 2.0, 3.0, 5.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6953125, -8.403076171875, -8.11083984375, -7.818603515625, -7.5263671875, -7.234130859375, -6.94189453125, -6.649658203125, -6.357421875, -6.065185546875, -5.77294921875, -5.480712890625, -5.1884765625, -4.896240234375, -4.60400390625, -4.311767578125, -4.01953125, -3.727294921875, -3.43505859375, -3.142822265625, -2.8505859375, -2.558349609375, -2.26611328125, -1.973876953125, -1.681640625, -1.389404296875, -1.09716796875, -0.804931640625, -0.5126953125, -0.220458984375, 0.07177734375, 0.364013671875, 0.65625, 0.948486328125, 1.24072265625, 1.532958984375, 1.8251953125, 2.117431640625, 2.40966796875, 2.701904296875, 2.994140625, 3.286376953125, 3.57861328125, 3.870849609375, 4.1630859375, 4.455322265625, 4.74755859375, 5.039794921875, 5.33203125, 5.624267578125, 5.91650390625, 6.208740234375, 6.5009765625, 6.793212890625, 7.08544921875, 7.377685546875, 7.669921875, 7.962158203125, 8.25439453125, 8.546630859375, 8.8388671875, 9.131103515625, 9.42333984375, 9.715576171875, 10.0078125]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 1.0, 7.0, 11.0, 7.0, 13.0, 14.0, 18.0, 27.0, 36.0, 45.0, 60.0, 73.0, 94.0, 154.0, 229.0, 364.0, 573.0, 992.0, 1903.0, 3919.0, 9249.0, 35531.0, 3168565.0, 935198.0, 22642.0, 7290.0, 3291.0, 1595.0, 851.0, 510.0, 314.0, 218.0, 130.0, 92.0, 67.0, 42.0, 35.0, 27.0, 24.0, 19.0, 16.0, 14.0, 11.0, 0.0, 4.0, 5.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.9375, -42.5146484375, -41.091796875, -39.6689453125, -38.24609375, -36.8232421875, -35.400390625, -33.9775390625, -32.5546875, -31.1318359375, -29.708984375, -28.2861328125, -26.86328125, -25.4404296875, -24.017578125, -22.5947265625, -21.171875, -19.7490234375, -18.326171875, -16.9033203125, -15.48046875, -14.0576171875, -12.634765625, -11.2119140625, -9.7890625, -8.3662109375, -6.943359375, -5.5205078125, -4.09765625, -2.6748046875, -1.251953125, 0.1708984375, 1.59375, 3.0166015625, 4.439453125, 5.8623046875, 7.28515625, 8.7080078125, 10.130859375, 11.5537109375, 12.9765625, 14.3994140625, 15.822265625, 17.2451171875, 18.66796875, 20.0908203125, 21.513671875, 22.9365234375, 24.359375, 25.7822265625, 27.205078125, 28.6279296875, 30.05078125, 31.4736328125, 32.896484375, 34.3193359375, 35.7421875, 37.1650390625, 38.587890625, 40.0107421875, 41.43359375, 42.8564453125, 44.279296875, 45.7021484375, 47.125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 5.0, 1.0, 7.0, 7.0, 6.0, 12.0, 9.0, 12.0, 21.0, 21.0, 15.0, 37.0, 38.0, 78.0, 130.0, 284.0, 641.0, 1100.0, 812.0, 375.0, 151.0, 96.0, 39.0, 38.0, 19.0, 22.0, 19.0, 21.0, 15.0, 15.0, 4.0, 10.0, 1.0, 4.0, 4.0, 3.0, 6.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.390625, -24.438720703125, -23.48681640625, -22.534912109375, -21.5830078125, -20.631103515625, -19.67919921875, -18.727294921875, -17.775390625, -16.823486328125, -15.87158203125, -14.919677734375, -13.9677734375, -13.015869140625, -12.06396484375, -11.112060546875, -10.16015625, -9.208251953125, -8.25634765625, -7.304443359375, -6.3525390625, -5.400634765625, -4.44873046875, -3.496826171875, -2.544921875, -1.593017578125, -0.64111328125, 0.310791015625, 1.2626953125, 2.214599609375, 3.16650390625, 4.118408203125, 5.0703125, 6.022216796875, 6.97412109375, 7.926025390625, 8.8779296875, 9.829833984375, 10.78173828125, 11.733642578125, 12.685546875, 13.637451171875, 14.58935546875, 15.541259765625, 16.4931640625, 17.445068359375, 18.39697265625, 19.348876953125, 20.30078125, 21.252685546875, 22.20458984375, 23.156494140625, 24.1083984375, 25.060302734375, 26.01220703125, 26.964111328125, 27.916015625, 28.867919921875, 29.81982421875, 30.771728515625, 31.7236328125, 32.675537109375, 33.62744140625, 34.579345703125, 35.53125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 3.0, 4.0, 6.0, 5.0, 15.0, 17.0, 28.0, 25.0, 63.0, 86.0, 125.0, 218.0, 438.0, 837.0, 1869.0, 4775.0, 14118.0, 52428.0, 1022673.0, 2992603.0, 75702.0, 17965.0, 5885.0, 2293.0, 985.0, 436.0, 263.0, 138.0, 101.0, 66.0, 31.0, 23.0, 17.0, 16.0, 5.0, 11.0, 6.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.40625, -40.841796875, -39.27734375, -37.712890625, -36.1484375, -34.583984375, -33.01953125, -31.455078125, -29.890625, -28.326171875, -26.76171875, -25.197265625, -23.6328125, -22.068359375, -20.50390625, -18.939453125, -17.375, -15.810546875, -14.24609375, -12.681640625, -11.1171875, -9.552734375, -7.98828125, -6.423828125, -4.859375, -3.294921875, -1.73046875, -0.166015625, 1.3984375, 2.962890625, 4.52734375, 6.091796875, 7.65625, 9.220703125, 10.78515625, 12.349609375, 13.9140625, 15.478515625, 17.04296875, 18.607421875, 20.171875, 21.736328125, 23.30078125, 24.865234375, 26.4296875, 27.994140625, 29.55859375, 31.123046875, 32.6875, 34.251953125, 35.81640625, 37.380859375, 38.9453125, 40.509765625, 42.07421875, 43.638671875, 45.203125, 46.767578125, 48.33203125, 49.896484375, 51.4609375, 53.025390625, 54.58984375, 56.154296875, 57.71875]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [3.0, 0.0, 5.0, 9.0, 16.0, 39.0, 99.0, 177.0, 309.0, 223.0, 68.0, 36.0, 16.0, 8.0, 7.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.44499206542969, -43.59242248535156, -37.73985290527344, -31.887279510498047, -26.034709930419922, -20.182140350341797, -14.329566955566406, -8.476997375488281, -2.6244277954101562, 3.228142738342285, 9.080713272094727, 14.933284759521484, 20.78585433959961, 26.638423919677734, 32.490997314453125, 38.34356689453125, 44.196136474609375, 50.0487060546875, 55.901275634765625, 61.753849029541016, 67.60641479492188, 73.458984375, 79.31156158447266, 85.16413116455078, 91.0167007446289, 96.86927032470703, 102.72183990478516, 108.57441711425781, 114.42698669433594, 120.27955627441406, 126.13212585449219, 131.9846954345703, 137.83724975585938, 143.6898193359375, 149.54238891601562, 155.39495849609375, 161.24752807617188, 167.10009765625, 172.95266723632812, 178.80523681640625, 184.65780639648438, 190.5103759765625, 196.36294555664062, 202.21551513671875, 208.06808471679688, 213.920654296875, 219.77322387695312, 225.62579345703125, 231.47837829589844, 237.33094787597656, 243.1835174560547, 249.0360870361328, 254.88865661621094, 260.7412414550781, 266.59381103515625, 272.4463806152344, 278.2989501953125, 284.1515197753906, 290.00408935546875, 295.8566589355469, 301.709228515625, 307.5617980957031, 313.41436767578125, 319.2669372558594, 325.1195068359375]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 4.0, 10.0, 6.0, 13.0, 14.0, 12.0, 14.0, 25.0, 20.0, 23.0, 21.0, 28.0, 28.0, 30.0, 32.0, 24.0, 30.0, 35.0, 37.0, 43.0, 38.0, 41.0, 39.0, 41.0, 41.0, 42.0, 41.0, 27.0, 37.0, 22.0, 27.0, 21.0, 27.0, 16.0, 17.0, 9.0, 11.0, 8.0, 5.0, 6.0, 7.0, 1.0, 8.0, 8.0, 5.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0], "bins": [-79.05381774902344, -76.65140533447266, -74.24899291992188, -71.84658813476562, -69.44417572021484, -67.04176330566406, -64.63935089111328, -62.2369384765625, -59.834529876708984, -57.4321174621582, -55.02970886230469, -52.627296447753906, -50.224884033203125, -47.82247543334961, -45.42006301879883, -43.01765441894531, -40.61524200439453, -38.21282958984375, -35.810420989990234, -33.40800857543945, -31.005598068237305, -28.603187561035156, -26.200775146484375, -23.798364639282227, -21.395954132080078, -18.99354362487793, -16.59113311767578, -14.188720703125, -11.786310195922852, -9.383899688720703, -6.981488227844238, -4.579076766967773, -2.176666259765625, 0.22574472427368164, 2.6281557083129883, 5.030566692352295, 7.432977676391602, 9.83538818359375, 12.237799644470215, 14.64021110534668, 17.042621612548828, 19.445032119750977, 21.847442626953125, 24.249855041503906, 26.652265548706055, 29.054676055908203, 31.457088470458984, 33.8594970703125, 36.26190948486328, 38.66432189941406, 41.06673049926758, 43.46914291381836, 45.871551513671875, 48.273963928222656, 50.67637634277344, 53.07878875732422, 55.481197357177734, 57.883609771728516, 60.28601837158203, 62.68843078613281, 65.0908432006836, 67.49325561523438, 69.89566040039062, 72.2980728149414, 74.70048522949219]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 2.0, 6.0, 5.0, 9.0, 7.0, 7.0, 15.0, 8.0, 10.0, 14.0, 17.0, 16.0, 24.0, 37.0, 29.0, 35.0, 38.0, 62.0, 50.0, 70.0, 66.0, 68.0, 62.0, 55.0, 40.0, 35.0, 26.0, 20.0, 23.0, 28.0, 20.0, 17.0, 14.0, 13.0, 5.0, 8.0, 7.0, 5.0, 7.0, 6.0, 3.0, 3.0, 6.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.65625, -8.3724365234375, -8.088623046875, -7.8048095703125, -7.52099609375, -7.2371826171875, -6.953369140625, -6.6695556640625, -6.3857421875, -6.1019287109375, -5.818115234375, -5.5343017578125, -5.25048828125, -4.9666748046875, -4.682861328125, -4.3990478515625, -4.115234375, -3.8314208984375, -3.547607421875, -3.2637939453125, -2.97998046875, -2.6961669921875, -2.412353515625, -2.1285400390625, -1.8447265625, -1.5609130859375, -1.277099609375, -0.9932861328125, -0.70947265625, -0.4256591796875, -0.141845703125, 0.1419677734375, 0.42578125, 0.7095947265625, 0.993408203125, 1.2772216796875, 1.56103515625, 1.8448486328125, 2.128662109375, 2.4124755859375, 2.6962890625, 2.9801025390625, 3.263916015625, 3.5477294921875, 3.83154296875, 4.1153564453125, 4.399169921875, 4.6829833984375, 4.966796875, 5.2506103515625, 5.534423828125, 5.8182373046875, 6.10205078125, 6.3858642578125, 6.669677734375, 6.9534912109375, 7.2373046875, 7.5211181640625, 7.804931640625, 8.0887451171875, 8.37255859375, 8.6563720703125, 8.940185546875, 9.2239990234375, 9.5078125]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 7.0, 13.0, 16.0, 21.0, 29.0, 42.0, 58.0, 92.0, 140.0, 198.0, 291.0, 383.0, 602.0, 903.0, 1415.0, 2069.0, 3244.0, 5069.0, 7863.0, 12682.0, 20447.0, 33906.0, 58124.0, 105139.0, 200613.0, 265556.0, 140401.0, 76671.0, 43141.0, 25716.0, 15952.0, 9848.0, 6182.0, 4023.0, 2674.0, 1643.0, 1087.0, 731.0, 520.0, 318.0, 222.0, 157.0, 115.0, 79.0, 51.0, 30.0, 30.0, 20.0, 8.0, 5.0, 8.0, 1.0, 7.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1685791015625, -0.16334915161132812, -0.15811920166015625, -0.15288925170898438, -0.1476593017578125, -0.14242935180664062, -0.13719940185546875, -0.13196945190429688, -0.126739501953125, -0.12150955200195312, -0.11627960205078125, -0.11104965209960938, -0.1058197021484375, -0.10058975219726562, -0.09535980224609375, -0.09012985229492188, -0.08489990234375, -0.07966995239257812, -0.07444000244140625, -0.06921005249023438, -0.0639801025390625, -0.058750152587890625, -0.05352020263671875, -0.048290252685546875, -0.043060302734375, -0.037830352783203125, -0.03260040283203125, -0.027370452880859375, -0.0221405029296875, -0.016910552978515625, -0.01168060302734375, -0.006450653076171875, -0.001220703125, 0.004009246826171875, 0.00923919677734375, 0.014469146728515625, 0.0196990966796875, 0.024929046630859375, 0.03015899658203125, 0.035388946533203125, 0.040618896484375, 0.045848846435546875, 0.05107879638671875, 0.056308746337890625, 0.0615386962890625, 0.06676864624023438, 0.07199859619140625, 0.07722854614257812, 0.08245849609375, 0.08768844604492188, 0.09291839599609375, 0.09814834594726562, 0.1033782958984375, 0.10860824584960938, 0.11383819580078125, 0.11906814575195312, 0.124298095703125, 0.12952804565429688, 0.13475799560546875, 0.13998794555664062, 0.1452178955078125, 0.15044784545898438, 0.15567779541015625, 0.16090774536132812, 0.1661376953125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 5.0, 7.0, 7.0, 6.0, 7.0, 6.0, 9.0, 11.0, 19.0, 19.0, 22.0, 18.0, 27.0, 32.0, 27.0, 42.0, 32.0, 32.0, 48.0, 47.0, 41.0, 1066.0, 52.0, 50.0, 41.0, 48.0, 34.0, 41.0, 33.0, 25.0, 28.0, 29.0, 22.0, 14.0, 14.0, 9.0, 12.0, 8.0, 12.0, 8.0, 6.0, 5.0, 4.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.63671875, -4.50140380859375, -4.3660888671875, -4.23077392578125, -4.095458984375, -3.96014404296875, -3.8248291015625, -3.68951416015625, -3.55419921875, -3.41888427734375, -3.2835693359375, -3.14825439453125, -3.012939453125, -2.87762451171875, -2.7423095703125, -2.60699462890625, -2.4716796875, -2.33636474609375, -2.2010498046875, -2.06573486328125, -1.930419921875, -1.79510498046875, -1.6597900390625, -1.52447509765625, -1.38916015625, -1.25384521484375, -1.1185302734375, -0.98321533203125, -0.847900390625, -0.71258544921875, -0.5772705078125, -0.44195556640625, -0.306640625, -0.17132568359375, -0.0360107421875, 0.09930419921875, 0.234619140625, 0.36993408203125, 0.5052490234375, 0.64056396484375, 0.77587890625, 0.91119384765625, 1.0465087890625, 1.18182373046875, 1.317138671875, 1.45245361328125, 1.5877685546875, 1.72308349609375, 1.8583984375, 1.99371337890625, 2.1290283203125, 2.26434326171875, 2.399658203125, 2.53497314453125, 2.6702880859375, 2.80560302734375, 2.94091796875, 3.07623291015625, 3.2115478515625, 3.34686279296875, 3.482177734375, 3.61749267578125, 3.7528076171875, 3.88812255859375, 4.0234375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 7.0, 2.0, 7.0, 9.0, 12.0, 19.0, 30.0, 31.0, 67.0, 93.0, 134.0, 203.0, 246.0, 413.0, 540.0, 826.0, 1162.0, 1765.0, 2486.0, 3837.0, 5561.0, 8392.0, 12643.0, 18930.0, 28477.0, 43976.0, 66942.0, 106046.0, 169602.0, 1250352.0, 132505.0, 83545.0, 53693.0, 35029.0, 23111.0, 15461.0, 10020.0, 6748.0, 4483.0, 3084.0, 2017.0, 1439.0, 972.0, 729.0, 440.0, 329.0, 207.0, 162.0, 119.0, 81.0, 59.0, 44.0, 26.0, 9.0, 9.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.0650634765625, -0.06304550170898438, -0.06102752685546875, -0.059009552001953125, -0.0569915771484375, -0.054973602294921875, -0.05295562744140625, -0.050937652587890625, -0.048919677734375, -0.046901702880859375, -0.04488372802734375, -0.042865753173828125, -0.0408477783203125, -0.038829803466796875, -0.03681182861328125, -0.034793853759765625, -0.03277587890625, -0.030757904052734375, -0.02873992919921875, -0.026721954345703125, -0.0247039794921875, -0.022686004638671875, -0.02066802978515625, -0.018650054931640625, -0.016632080078125, -0.014614105224609375, -0.01259613037109375, -0.010578155517578125, -0.0085601806640625, -0.006542205810546875, -0.00452423095703125, -0.002506256103515625, -0.00048828125, 0.001529693603515625, 0.00354766845703125, 0.005565643310546875, 0.0075836181640625, 0.009601593017578125, 0.01161956787109375, 0.013637542724609375, 0.015655517578125, 0.017673492431640625, 0.01969146728515625, 0.021709442138671875, 0.0237274169921875, 0.025745391845703125, 0.02776336669921875, 0.029781341552734375, 0.03179931640625, 0.033817291259765625, 0.03583526611328125, 0.037853240966796875, 0.0398712158203125, 0.041889190673828125, 0.04390716552734375, 0.045925140380859375, 0.047943115234375, 0.049961090087890625, 0.05197906494140625, 0.053997039794921875, 0.0560150146484375, 0.058032989501953125, 0.06005096435546875, 0.062068939208984375, 0.0640869140625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 0.0, 0.0, 3.0, 3.0, 7.0, 6.0, 4.0, 7.0, 7.0, 6.0, 12.0, 21.0, 18.0, 20.0, 26.0, 31.0, 38.0, 45.0, 62.0, 70.0, 74.0, 67.0, 77.0, 61.0, 60.0, 40.0, 50.0, 37.0, 30.0, 16.0, 25.0, 19.0, 17.0, 14.0, 5.0, 4.0, 7.0, 7.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.00015294551849365234, -0.00014812685549259186, -0.00014330819249153137, -0.00013848952949047089, -0.0001336708664894104, -0.00012885220348834991, -0.00012403354048728943, -0.00011921487748622894, -0.00011439621448516846, -0.00010957755148410797, -0.00010475888848304749, -9.9940225481987e-05, -9.512156248092651e-05, -9.030289947986603e-05, -8.548423647880554e-05, -8.066557347774506e-05, -7.584691047668457e-05, -7.102824747562408e-05, -6.62095844745636e-05, -6.139092147350311e-05, -5.657225847244263e-05, -5.175359547138214e-05, -4.6934932470321655e-05, -4.211626946926117e-05, -3.7297606468200684e-05, -3.24789434671402e-05, -2.7660280466079712e-05, -2.2841617465019226e-05, -1.802295446395874e-05, -1.3204291462898254e-05, -8.385628461837769e-06, -3.5669654607772827e-06, 1.2516975402832031e-06, 6.070360541343689e-06, 1.0889023542404175e-05, 1.570768654346466e-05, 2.0526349544525146e-05, 2.5345012545585632e-05, 3.0163675546646118e-05, 3.4982338547706604e-05, 3.980100154876709e-05, 4.4619664549827576e-05, 4.943832755088806e-05, 5.425699055194855e-05, 5.907565355300903e-05, 6.389431655406952e-05, 6.871297955513e-05, 7.353164255619049e-05, 7.835030555725098e-05, 8.316896855831146e-05, 8.798763155937195e-05, 9.280629456043243e-05, 9.762495756149292e-05, 0.0001024436205625534, 0.00010726228356361389, 0.00011208094656467438, 0.00011689960956573486, 0.00012171827256679535, 0.00012653693556785583, 0.00013135559856891632, 0.0001361742615699768, 0.0001409929245710373, 0.00014581158757209778, 0.00015063025057315826, 0.00015544891357421875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 2.0, 3.0, 11.0, 7.0, 13.0, 19.0, 15.0, 26.0, 16.0, 33.0, 36.0, 61.0, 78.0, 90.0, 87.0, 134.0, 173.0, 224.0, 349.0, 1076.0, 35244.0, 999309.0, 9600.0, 678.0, 299.0, 199.0, 152.0, 135.0, 100.0, 72.0, 69.0, 58.0, 45.0, 22.0, 22.0, 19.0, 18.0, 20.0, 10.0, 7.0, 3.0, 5.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0], "bins": [-0.00244903564453125, -0.0023733675479888916, -0.002297699451446533, -0.002222031354904175, -0.0021463632583618164, -0.002070695161819458, -0.0019950270652770996, -0.0019193589687347412, -0.0018436908721923828, -0.0017680227756500244, -0.001692354679107666, -0.0016166865825653076, -0.0015410184860229492, -0.0014653503894805908, -0.0013896822929382324, -0.001314014196395874, -0.0012383460998535156, -0.0011626780033111572, -0.0010870099067687988, -0.0010113418102264404, -0.000935673713684082, -0.0008600056171417236, -0.0007843375205993652, -0.0007086694240570068, -0.0006330013275146484, -0.00055733323097229, -0.00048166513442993164, -0.00040599703788757324, -0.00033032894134521484, -0.00025466084480285645, -0.00017899274826049805, -0.00010332465171813965, -2.765655517578125e-05, 4.801154136657715e-05, 0.00012367963790893555, 0.00019934773445129395, 0.00027501583099365234, 0.00035068392753601074, 0.00042635202407836914, 0.0005020201206207275, 0.0005776882171630859, 0.0006533563137054443, 0.0007290244102478027, 0.0008046925067901611, 0.0008803606033325195, 0.0009560286998748779, 0.0010316967964172363, 0.0011073648929595947, 0.0011830329895019531, 0.0012587010860443115, 0.00133436918258667, 0.0014100372791290283, 0.0014857053756713867, 0.0015613734722137451, 0.0016370415687561035, 0.001712709665298462, 0.0017883777618408203, 0.0018640458583831787, 0.0019397139549255371, 0.0020153820514678955, 0.002091050148010254, 0.0021667182445526123, 0.0022423863410949707, 0.002318054437637329, 0.0023937225341796875]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 9.0, 21.0, 82.0, 391.0, 362.0, 85.0, 37.0, 12.0, 4.0, 1.0, 1.0, 2.0], "bins": [-0.0005354912136681378, -0.0005259194294922054, -0.0005163475871086121, -0.0005067758029326797, -0.0004972039605490863, -0.00048763214726932347, -0.0004780603339895606, -0.00046848852070979774, -0.0004589167074300349, -0.000449344894150272, -0.00043977308087050915, -0.0004302012675907463, -0.0004206294543109834, -0.00041105764103122056, -0.0004014858277514577, -0.0003919140144716948, -0.00038234220119193196, -0.0003727703879121691, -0.00036319857463240623, -0.00035362676135264337, -0.0003440549480728805, -0.00033448313479311764, -0.0003249113215133548, -0.0003153395082335919, -0.0003057677240576595, -0.00029619591077789664, -0.0002866240974981338, -0.0002770522842183709, -0.00026748047093860805, -0.0002579086576588452, -0.0002483368443790823, -0.00023876503109931946, -0.00022919323237147182, -0.00021962141909170896, -0.0002100496058119461, -0.00020047779253218323, -0.00019090597925242037, -0.0001813341659726575, -0.00017176236724480987, -0.000162190553965047, -0.00015261874068528414, -0.00014304692740552127, -0.0001334751141257584, -0.00012390330084599555, -0.00011433148756623268, -0.00010475967428646982, -9.518786828266457e-05, -8.56160550029017e-05, -7.604423444718122e-05, -6.647242116741836e-05, -5.6900607887655497e-05, -4.732879824587144e-05, -3.7756984966108575e-05, -2.818517168634571e-05, -1.8613362044561654e-05, -9.04154876479879e-06, 5.302645149640739e-07, 1.0102076885232236e-05, 1.96738892555004e-05, 2.924570071627386e-05, 3.881751399603672e-05, 4.838932727579959e-05, 5.7961136917583644e-05, 6.753295019734651e-05, 7.710476347710937e-05]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 4.0, 8.0, 10.0, 10.0, 9.0, 10.0, 15.0, 23.0, 27.0, 28.0, 28.0, 27.0, 29.0, 36.0, 51.0, 48.0, 29.0, 51.0, 43.0, 48.0, 43.0, 39.0, 41.0, 41.0, 28.0, 34.0, 32.0, 22.0, 35.0, 31.0, 24.0, 10.0, 14.0, 11.0, 8.0, 13.0, 11.0, 4.0, 6.0, 6.0, 8.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.738040924072266e-05, -8.438806980848312e-05, -8.139573037624359e-05, -7.840339094400406e-05, -7.541105151176453e-05, -7.2418712079525e-05, -6.942637264728546e-05, -6.643403321504593e-05, -6.34416937828064e-05, -6.0449354350566864e-05, -5.745701491832733e-05, -5.44646754860878e-05, -5.1472336053848267e-05, -4.8479996621608734e-05, -4.54876571893692e-05, -4.249531775712967e-05, -3.950297832489014e-05, -3.6510638892650604e-05, -3.351829946041107e-05, -3.052596002817154e-05, -2.7533620595932007e-05, -2.4541281163692474e-05, -2.1548941731452942e-05, -1.855660229921341e-05, -1.5564262866973877e-05, -1.2571923434734344e-05, -9.579584002494812e-06, -6.5872445702552795e-06, -3.594905138015747e-06, -6.025657057762146e-07, 2.389773726463318e-06, 5.38211315870285e-06, 8.374452590942383e-06, 1.1366792023181915e-05, 1.4359131455421448e-05, 1.735147088766098e-05, 2.0343810319900513e-05, 2.3336149752140045e-05, 2.6328489184379578e-05, 2.932082861661911e-05, 3.231316804885864e-05, 3.5305507481098175e-05, 3.829784691333771e-05, 4.129018634557724e-05, 4.428252577781677e-05, 4.7274865210056305e-05, 5.026720464229584e-05, 5.325954407453537e-05, 5.62518835067749e-05, 5.9244222939014435e-05, 6.223656237125397e-05, 6.52289018034935e-05, 6.822124123573303e-05, 7.121358066797256e-05, 7.42059201002121e-05, 7.719825953245163e-05, 8.019059896469116e-05, 8.31829383969307e-05, 8.617527782917023e-05, 8.916761726140976e-05, 9.215995669364929e-05, 9.515229612588882e-05, 9.814463555812836e-05, 0.00010113697499036789, 0.00010412931442260742]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 2.0, 6.0, 5.0, 9.0, 7.0, 7.0, 15.0, 8.0, 10.0, 14.0, 17.0, 16.0, 24.0, 37.0, 29.0, 35.0, 38.0, 62.0, 50.0, 70.0, 66.0, 68.0, 62.0, 55.0, 40.0, 35.0, 26.0, 20.0, 23.0, 28.0, 20.0, 17.0, 14.0, 13.0, 5.0, 8.0, 7.0, 5.0, 7.0, 6.0, 3.0, 3.0, 6.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.65625, -8.3724365234375, -8.088623046875, -7.8048095703125, -7.52099609375, -7.2371826171875, -6.953369140625, -6.6695556640625, -6.3857421875, -6.1019287109375, -5.818115234375, -5.5343017578125, -5.25048828125, -4.9666748046875, -4.682861328125, -4.3990478515625, -4.115234375, -3.8314208984375, -3.547607421875, -3.2637939453125, -2.97998046875, -2.6961669921875, -2.412353515625, -2.1285400390625, -1.8447265625, -1.5609130859375, -1.277099609375, -0.9932861328125, -0.70947265625, -0.4256591796875, -0.141845703125, 0.1419677734375, 0.42578125, 0.7095947265625, 0.993408203125, 1.2772216796875, 1.56103515625, 1.8448486328125, 2.128662109375, 2.4124755859375, 2.6962890625, 2.9801025390625, 3.263916015625, 3.5477294921875, 3.83154296875, 4.1153564453125, 4.399169921875, 4.6829833984375, 4.966796875, 5.2506103515625, 5.534423828125, 5.8182373046875, 6.10205078125, 6.3858642578125, 6.669677734375, 6.9534912109375, 7.2373046875, 7.5211181640625, 7.804931640625, 8.0887451171875, 8.37255859375, 8.6563720703125, 8.940185546875, 9.2239990234375, 9.5078125]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 4.0, 2.0, 7.0, 3.0, 6.0, 9.0, 10.0, 21.0, 26.0, 39.0, 47.0, 93.0, 111.0, 172.0, 251.0, 364.0, 525.0, 771.0, 1273.0, 2559.0, 7108.0, 52627.0, 909271.0, 59406.0, 7361.0, 2642.0, 1369.0, 805.0, 507.0, 371.0, 247.0, 172.0, 117.0, 88.0, 47.0, 50.0, 17.0, 16.0, 14.0, 11.0, 5.0, 2.0, 7.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.453125, -19.782958984375, -19.11279296875, -18.442626953125, -17.7724609375, -17.102294921875, -16.43212890625, -15.761962890625, -15.091796875, -14.421630859375, -13.75146484375, -13.081298828125, -12.4111328125, -11.740966796875, -11.07080078125, -10.400634765625, -9.73046875, -9.060302734375, -8.39013671875, -7.719970703125, -7.0498046875, -6.379638671875, -5.70947265625, -5.039306640625, -4.369140625, -3.698974609375, -3.02880859375, -2.358642578125, -1.6884765625, -1.018310546875, -0.34814453125, 0.322021484375, 0.9921875, 1.662353515625, 2.33251953125, 3.002685546875, 3.6728515625, 4.343017578125, 5.01318359375, 5.683349609375, 6.353515625, 7.023681640625, 7.69384765625, 8.364013671875, 9.0341796875, 9.704345703125, 10.37451171875, 11.044677734375, 11.71484375, 12.385009765625, 13.05517578125, 13.725341796875, 14.3955078125, 15.065673828125, 15.73583984375, 16.406005859375, 17.076171875, 17.746337890625, 18.41650390625, 19.086669921875, 19.7568359375, 20.427001953125, 21.09716796875, 21.767333984375, 22.4375]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 0.0, 2.0, 2.0, 4.0, 7.0, 7.0, 6.0, 9.0, 11.0, 15.0, 14.0, 18.0, 33.0, 27.0, 29.0, 31.0, 40.0, 35.0, 34.0, 45.0, 60.0, 106.0, 1716.0, 268.0, 85.0, 54.0, 44.0, 54.0, 35.0, 42.0, 28.0, 28.0, 30.0, 20.0, 15.0, 14.0, 15.0, 20.0, 12.0, 9.0, 4.0, 7.0, 4.0, 0.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-30.640625, -29.706298828125, -28.77197265625, -27.837646484375, -26.9033203125, -25.968994140625, -25.03466796875, -24.100341796875, -23.166015625, -22.231689453125, -21.29736328125, -20.363037109375, -19.4287109375, -18.494384765625, -17.56005859375, -16.625732421875, -15.69140625, -14.757080078125, -13.82275390625, -12.888427734375, -11.9541015625, -11.019775390625, -10.08544921875, -9.151123046875, -8.216796875, -7.282470703125, -6.34814453125, -5.413818359375, -4.4794921875, -3.545166015625, -2.61083984375, -1.676513671875, -0.7421875, 0.192138671875, 1.12646484375, 2.060791015625, 2.9951171875, 3.929443359375, 4.86376953125, 5.798095703125, 6.732421875, 7.666748046875, 8.60107421875, 9.535400390625, 10.4697265625, 11.404052734375, 12.33837890625, 13.272705078125, 14.20703125, 15.141357421875, 16.07568359375, 17.010009765625, 17.9443359375, 18.878662109375, 19.81298828125, 20.747314453125, 21.681640625, 22.615966796875, 23.55029296875, 24.484619140625, 25.4189453125, 26.353271484375, 27.28759765625, 28.221923828125, 29.15625]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 1.0, 2.0, 3.0, 4.0, 6.0, 8.0, 7.0, 17.0, 11.0, 18.0, 20.0, 21.0, 29.0, 27.0, 51.0, 71.0, 117.0, 219.0, 434.0, 974.0, 2438.0, 10508.0, 2923485.0, 198011.0, 5825.0, 1736.0, 754.0, 343.0, 178.0, 102.0, 67.0, 51.0, 49.0, 24.0, 23.0, 16.0, 15.0, 11.0, 6.0, 6.0, 7.0, 4.0, 3.0, 2.0, 2.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-47.5625, -46.02001953125, -44.4775390625, -42.93505859375, -41.392578125, -39.85009765625, -38.3076171875, -36.76513671875, -35.22265625, -33.68017578125, -32.1376953125, -30.59521484375, -29.052734375, -27.51025390625, -25.9677734375, -24.42529296875, -22.8828125, -21.34033203125, -19.7978515625, -18.25537109375, -16.712890625, -15.17041015625, -13.6279296875, -12.08544921875, -10.54296875, -9.00048828125, -7.4580078125, -5.91552734375, -4.373046875, -2.83056640625, -1.2880859375, 0.25439453125, 1.796875, 3.33935546875, 4.8818359375, 6.42431640625, 7.966796875, 9.50927734375, 11.0517578125, 12.59423828125, 14.13671875, 15.67919921875, 17.2216796875, 18.76416015625, 20.306640625, 21.84912109375, 23.3916015625, 24.93408203125, 26.4765625, 28.01904296875, 29.5615234375, 31.10400390625, 32.646484375, 34.18896484375, 35.7314453125, 37.27392578125, 38.81640625, 40.35888671875, 41.9013671875, 43.44384765625, 44.986328125, 46.52880859375, 48.0712890625, 49.61376953125, 51.15625]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 10.0, 54.0, 385.0, 496.0, 61.0, 11.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.58192443847656, -109.81767272949219, -104.05342864990234, -98.28917694091797, -92.52493286132812, -86.76068115234375, -80.99642944335938, -75.23218536376953, -69.46794128417969, -63.70369338989258, -57.93944549560547, -52.175193786621094, -46.41094970703125, -40.646697998046875, -34.882450103759766, -29.118202209472656, -23.35395050048828, -17.589702606201172, -11.825453758239746, -6.06120491027832, -0.29695701599121094, 5.467290878295898, 11.23154067993164, 16.99578857421875, 22.76003646850586, 28.52428436279297, 34.28853225708008, 40.05278015136719, 45.81703186035156, 51.581275939941406, 57.34552764892578, 63.10977554321289, 68.8740234375, 74.63827514648438, 80.40251922607422, 86.1667709350586, 91.93101501464844, 97.69526672363281, 103.45951843261719, 109.22376251220703, 114.98800659179688, 120.75225830078125, 126.5165023803711, 132.28074645996094, 138.0449981689453, 143.8092498779297, 149.57350158691406, 155.33773803710938, 161.10198974609375, 166.86624145507812, 172.6304931640625, 178.3947296142578, 184.1589813232422, 189.92323303222656, 195.68748474121094, 201.45172119140625, 207.2159881591797, 212.98023986816406, 218.74449157714844, 224.50872802734375, 230.27297973632812, 236.0372314453125, 241.80148315429688, 247.56573486328125, 253.32997131347656]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 10.0, 7.0, 12.0, 13.0, 18.0, 26.0, 24.0, 21.0, 21.0, 22.0, 33.0, 31.0, 40.0, 42.0, 39.0, 34.0, 42.0, 52.0, 55.0, 36.0, 46.0, 33.0, 43.0, 33.0, 38.0, 35.0, 31.0, 28.0, 23.0, 25.0, 16.0, 6.0, 18.0, 8.0, 5.0, 9.0, 7.0, 4.0, 4.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-103.51428985595703, -100.1222915649414, -96.73029327392578, -93.33828735351562, -89.9462890625, -86.55429077148438, -83.16229248046875, -79.77029418945312, -76.3782958984375, -72.98629760742188, -69.59429931640625, -66.20230102539062, -62.81029510498047, -59.418296813964844, -56.02629852294922, -52.634300231933594, -49.24229431152344, -45.85029602050781, -42.45829391479492, -39.0662956237793, -35.674293518066406, -32.28229522705078, -28.890296936035156, -25.4982967376709, -22.10629653930664, -18.714296340942383, -15.322297096252441, -11.9302978515625, -8.538297653198242, -5.146297454833984, -1.7542991638183594, 1.6377010345458984, 5.029701232910156, 8.421701431274414, 11.813700675964355, 15.205699920654297, 18.597700119018555, 21.989700317382812, 25.381698608398438, 28.773698806762695, 32.16569900512695, 35.55769729614258, 38.94969940185547, 42.341697692871094, 45.73369598388672, 49.12569808959961, 52.517696380615234, 55.909698486328125, 59.30169677734375, 62.693695068359375, 66.085693359375, 69.47769165039062, 72.86969757080078, 76.2616958618164, 79.65369415283203, 83.04569244384766, 86.43769836425781, 89.82969665527344, 93.22169494628906, 96.61369323730469, 100.00569915771484, 103.39769744873047, 106.7896957397461, 110.18169403076172, 113.57369232177734]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 2.0, 7.0, 4.0, 4.0, 7.0, 13.0, 8.0, 10.0, 14.0, 10.0, 17.0, 24.0, 22.0, 22.0, 41.0, 37.0, 46.0, 57.0, 54.0, 63.0, 71.0, 58.0, 64.0, 57.0, 42.0, 31.0, 32.0, 21.0, 29.0, 22.0, 17.0, 20.0, 11.0, 13.0, 9.0, 6.0, 4.0, 5.0, 7.0, 8.0, 2.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.921875, -8.62890625, -8.3359375, -8.04296875, -7.75, -7.45703125, -7.1640625, -6.87109375, -6.578125, -6.28515625, -5.9921875, -5.69921875, -5.40625, -5.11328125, -4.8203125, -4.52734375, -4.234375, -3.94140625, -3.6484375, -3.35546875, -3.0625, -2.76953125, -2.4765625, -2.18359375, -1.890625, -1.59765625, -1.3046875, -1.01171875, -0.71875, -0.42578125, -0.1328125, 0.16015625, 0.453125, 0.74609375, 1.0390625, 1.33203125, 1.625, 1.91796875, 2.2109375, 2.50390625, 2.796875, 3.08984375, 3.3828125, 3.67578125, 3.96875, 4.26171875, 4.5546875, 4.84765625, 5.140625, 5.43359375, 5.7265625, 6.01953125, 6.3125, 6.60546875, 6.8984375, 7.19140625, 7.484375, 7.77734375, 8.0703125, 8.36328125, 8.65625, 8.94921875, 9.2421875, 9.53515625, 9.828125]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 7.0, 12.0, 6.0, 11.0, 22.0, 38.0, 41.0, 51.0, 74.0, 99.0, 162.0, 273.0, 332.0, 539.0, 841.0, 1310.0, 2376.0, 4371.0, 8819.0, 27489.0, 698260.0, 3317458.0, 104353.0, 13454.0, 5952.0, 3182.0, 1726.0, 1023.0, 659.0, 439.0, 286.0, 172.0, 140.0, 89.0, 59.0, 39.0, 29.0, 25.0, 16.0, 12.0, 10.0, 7.0, 5.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.234375, -30.201416015625, -29.16845703125, -28.135498046875, -27.1025390625, -26.069580078125, -25.03662109375, -24.003662109375, -22.970703125, -21.937744140625, -20.90478515625, -19.871826171875, -18.8388671875, -17.805908203125, -16.77294921875, -15.739990234375, -14.70703125, -13.674072265625, -12.64111328125, -11.608154296875, -10.5751953125, -9.542236328125, -8.50927734375, -7.476318359375, -6.443359375, -5.410400390625, -4.37744140625, -3.344482421875, -2.3115234375, -1.278564453125, -0.24560546875, 0.787353515625, 1.8203125, 2.853271484375, 3.88623046875, 4.919189453125, 5.9521484375, 6.985107421875, 8.01806640625, 9.051025390625, 10.083984375, 11.116943359375, 12.14990234375, 13.182861328125, 14.2158203125, 15.248779296875, 16.28173828125, 17.314697265625, 18.34765625, 19.380615234375, 20.41357421875, 21.446533203125, 22.4794921875, 23.512451171875, 24.54541015625, 25.578369140625, 26.611328125, 27.644287109375, 28.67724609375, 29.710205078125, 30.7431640625, 31.776123046875, 32.80908203125, 33.842041015625, 34.875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 8.0, 11.0, 11.0, 21.0, 25.0, 42.0, 79.0, 156.0, 480.0, 1417.0, 1166.0, 349.0, 107.0, 55.0, 43.0, 29.0, 19.0, 15.0, 16.0, 7.0, 3.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.0625, -33.654296875, -32.24609375, -30.837890625, -29.4296875, -28.021484375, -26.61328125, -25.205078125, -23.796875, -22.388671875, -20.98046875, -19.572265625, -18.1640625, -16.755859375, -15.34765625, -13.939453125, -12.53125, -11.123046875, -9.71484375, -8.306640625, -6.8984375, -5.490234375, -4.08203125, -2.673828125, -1.265625, 0.142578125, 1.55078125, 2.958984375, 4.3671875, 5.775390625, 7.18359375, 8.591796875, 10.0, 11.408203125, 12.81640625, 14.224609375, 15.6328125, 17.041015625, 18.44921875, 19.857421875, 21.265625, 22.673828125, 24.08203125, 25.490234375, 26.8984375, 28.306640625, 29.71484375, 31.123046875, 32.53125, 33.939453125, 35.34765625, 36.755859375, 38.1640625, 39.572265625, 40.98046875, 42.388671875, 43.796875, 45.205078125, 46.61328125, 48.021484375, 49.4296875, 50.837890625, 52.24609375, 53.654296875, 55.0625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 4.0, 8.0, 15.0, 15.0, 33.0, 61.0, 90.0, 160.0, 396.0, 1100.0, 4279.0, 29231.0, 3601926.0, 536361.0, 16346.0, 2785.0, 837.0, 300.0, 136.0, 94.0, 48.0, 18.0, 17.0, 4.0, 8.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-105.3125, -102.4560546875, -99.599609375, -96.7431640625, -93.88671875, -91.0302734375, -88.173828125, -85.3173828125, -82.4609375, -79.6044921875, -76.748046875, -73.8916015625, -71.03515625, -68.1787109375, -65.322265625, -62.4658203125, -59.609375, -56.7529296875, -53.896484375, -51.0400390625, -48.18359375, -45.3271484375, -42.470703125, -39.6142578125, -36.7578125, -33.9013671875, -31.044921875, -28.1884765625, -25.33203125, -22.4755859375, -19.619140625, -16.7626953125, -13.90625, -11.0498046875, -8.193359375, -5.3369140625, -2.48046875, 0.3759765625, 3.232421875, 6.0888671875, 8.9453125, 11.8017578125, 14.658203125, 17.5146484375, 20.37109375, 23.2275390625, 26.083984375, 28.9404296875, 31.796875, 34.6533203125, 37.509765625, 40.3662109375, 43.22265625, 46.0791015625, 48.935546875, 51.7919921875, 54.6484375, 57.5048828125, 60.361328125, 63.2177734375, 66.07421875, 68.9306640625, 71.787109375, 74.6435546875, 77.5]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 12.0, 67.0, 384.0, 447.0, 76.0, 26.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-348.3537902832031, -335.4908447265625, -322.6278991699219, -309.76495361328125, -296.9020080566406, -284.0390625, -271.1761474609375, -258.31317138671875, -245.4502410888672, -232.58729553222656, -219.72434997558594, -206.86141967773438, -193.99847412109375, -181.13552856445312, -168.2725830078125, -155.40963745117188, -142.54669189453125, -129.68374633789062, -116.82080078125, -103.9578628540039, -91.09491729736328, -78.23197174072266, -65.36903381347656, -52.50608825683594, -39.64314270019531, -26.78019905090332, -13.917255401611328, -1.0543136596679688, 11.808631896972656, 24.67157745361328, 37.534515380859375, 50.3974609375, 63.260406494140625, 76.12335205078125, 88.98629760742188, 101.84923553466797, 114.7121810913086, 127.57512664794922, 140.4380645751953, 153.30101013183594, 166.16395568847656, 179.0269012451172, 191.8898468017578, 204.75277709960938, 217.61572265625, 230.47866821289062, 243.34161376953125, 256.2045593261719, 269.0675048828125, 281.9304504394531, 294.79339599609375, 307.6563415527344, 320.519287109375, 333.3822326660156, 346.24517822265625, 359.10809326171875, 371.9710693359375, 384.8340148925781, 397.69696044921875, 410.5599060058594, 423.4228515625, 436.2857971191406, 449.14874267578125, 462.01165771484375, 474.8746032714844]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 5.0, 10.0, 8.0, 7.0, 15.0, 11.0, 7.0, 18.0, 18.0, 14.0, 21.0, 30.0, 34.0, 24.0, 38.0, 40.0, 33.0, 21.0, 29.0, 41.0, 39.0, 35.0, 38.0, 44.0, 37.0, 37.0, 41.0, 29.0, 32.0, 27.0, 27.0, 35.0, 18.0, 20.0, 21.0, 14.0, 14.0, 14.0, 13.0, 10.0, 6.0, 9.0, 6.0, 3.0, 1.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-78.59513092041016, -76.32500457763672, -74.05488586425781, -71.78475952148438, -69.51463317871094, -67.2445068359375, -64.9743881225586, -62.704261779785156, -60.434139251708984, -58.16401672363281, -55.893890380859375, -53.6237678527832, -51.35364532470703, -49.083518981933594, -46.81339645385742, -44.54327392578125, -42.27314758300781, -40.00302505493164, -37.7328987121582, -35.46277618408203, -33.192649841308594, -30.922527313232422, -28.65240478515625, -26.382280349731445, -24.11215591430664, -21.842031478881836, -19.57190704345703, -17.30178451538086, -15.031660079956055, -12.76153564453125, -10.491412162780762, -8.221288681030273, -5.9511566162109375, -3.681032657623291, -1.4109086990356445, 0.859215259552002, 3.1293392181396484, 5.399463653564453, 7.669587135314941, 9.93971061706543, 12.209835052490234, 14.479959487915039, 16.750083923339844, 19.020206451416016, 21.29033088684082, 23.560455322265625, 25.830577850341797, 28.1007022857666, 30.370826721191406, 32.64094924926758, 34.911075592041016, 37.18119812011719, 39.451324462890625, 41.7214469909668, 43.99156951904297, 46.261695861816406, 48.53181838989258, 50.80194091796875, 53.07206726074219, 55.34218978881836, 57.61231231689453, 59.88243865966797, 62.15256118774414, 64.42268371582031, 66.69281005859375]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 3.0, 2.0, 4.0, 6.0, 10.0, 11.0, 6.0, 14.0, 14.0, 12.0, 16.0, 26.0, 34.0, 21.0, 30.0, 45.0, 49.0, 44.0, 65.0, 53.0, 69.0, 48.0, 54.0, 55.0, 35.0, 41.0, 33.0, 39.0, 25.0, 18.0, 15.0, 18.0, 18.0, 9.0, 14.0, 10.0, 8.0, 4.0, 4.0, 2.0, 7.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.0859375, -8.8060302734375, -8.526123046875, -8.2462158203125, -7.96630859375, -7.6864013671875, -7.406494140625, -7.1265869140625, -6.8466796875, -6.5667724609375, -6.286865234375, -6.0069580078125, -5.72705078125, -5.4471435546875, -5.167236328125, -4.8873291015625, -4.607421875, -4.3275146484375, -4.047607421875, -3.7677001953125, -3.48779296875, -3.2078857421875, -2.927978515625, -2.6480712890625, -2.3681640625, -2.0882568359375, -1.808349609375, -1.5284423828125, -1.24853515625, -0.9686279296875, -0.688720703125, -0.4088134765625, -0.12890625, 0.1510009765625, 0.430908203125, 0.7108154296875, 0.99072265625, 1.2706298828125, 1.550537109375, 1.8304443359375, 2.1103515625, 2.3902587890625, 2.670166015625, 2.9500732421875, 3.22998046875, 3.5098876953125, 3.789794921875, 4.0697021484375, 4.349609375, 4.6295166015625, 4.909423828125, 5.1893310546875, 5.46923828125, 5.7491455078125, 6.029052734375, 6.3089599609375, 6.5888671875, 6.8687744140625, 7.148681640625, 7.4285888671875, 7.70849609375, 7.9884033203125, 8.268310546875, 8.5482177734375, 8.828125]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 4.0, 7.0, 11.0, 23.0, 21.0, 42.0, 57.0, 54.0, 99.0, 119.0, 215.0, 306.0, 377.0, 536.0, 776.0, 1119.0, 1593.0, 2320.0, 3214.0, 4743.0, 7189.0, 10487.0, 16367.0, 25248.0, 40103.0, 64931.0, 107957.0, 178207.0, 218938.0, 138440.0, 83256.0, 50114.0, 31307.0, 19854.0, 13069.0, 8577.0, 5915.0, 3894.0, 2781.0, 1831.0, 1316.0, 948.0, 660.0, 451.0, 321.0, 230.0, 134.0, 113.0, 91.0, 71.0, 37.0, 29.0, 23.0, 17.0, 7.0, 8.0, 6.0, 3.0, 1.0, 2.0], "bins": [-0.147705078125, -0.14312362670898438, -0.13854217529296875, -0.13396072387695312, -0.1293792724609375, -0.12479782104492188, -0.12021636962890625, -0.11563491821289062, -0.111053466796875, -0.10647201538085938, -0.10189056396484375, -0.09730911254882812, -0.0927276611328125, -0.08814620971679688, -0.08356475830078125, -0.07898330688476562, -0.07440185546875, -0.06982040405273438, -0.06523895263671875, -0.060657501220703125, -0.0560760498046875, -0.051494598388671875, -0.04691314697265625, -0.042331695556640625, -0.037750244140625, -0.033168792724609375, -0.02858734130859375, -0.024005889892578125, -0.0194244384765625, -0.014842987060546875, -0.01026153564453125, -0.005680084228515625, -0.0010986328125, 0.003482818603515625, 0.00806427001953125, 0.012645721435546875, 0.0172271728515625, 0.021808624267578125, 0.02639007568359375, 0.030971527099609375, 0.035552978515625, 0.040134429931640625, 0.04471588134765625, 0.049297332763671875, 0.0538787841796875, 0.058460235595703125, 0.06304168701171875, 0.06762313842773438, 0.07220458984375, 0.07678604125976562, 0.08136749267578125, 0.08594894409179688, 0.0905303955078125, 0.09511184692382812, 0.09969329833984375, 0.10427474975585938, 0.108856201171875, 0.11343765258789062, 0.11801910400390625, 0.12260055541992188, 0.1271820068359375, 0.13176345825195312, 0.13634490966796875, 0.14092636108398438, 0.1455078125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 10.0, 6.0, 3.0, 8.0, 6.0, 13.0, 12.0, 12.0, 13.0, 17.0, 18.0, 22.0, 19.0, 22.0, 22.0, 33.0, 34.0, 40.0, 33.0, 40.0, 55.0, 43.0, 1060.0, 39.0, 32.0, 49.0, 35.0, 39.0, 34.0, 32.0, 31.0, 25.0, 18.0, 29.0, 15.0, 13.0, 17.0, 16.0, 11.0, 8.0, 12.0, 6.0, 6.0, 7.0, 7.0, 7.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.1640625, -4.03155517578125, -3.8990478515625, -3.76654052734375, -3.634033203125, -3.50152587890625, -3.3690185546875, -3.23651123046875, -3.10400390625, -2.97149658203125, -2.8389892578125, -2.70648193359375, -2.573974609375, -2.44146728515625, -2.3089599609375, -2.17645263671875, -2.0439453125, -1.91143798828125, -1.7789306640625, -1.64642333984375, -1.513916015625, -1.38140869140625, -1.2489013671875, -1.11639404296875, -0.98388671875, -0.85137939453125, -0.7188720703125, -0.58636474609375, -0.453857421875, -0.32135009765625, -0.1888427734375, -0.05633544921875, 0.076171875, 0.20867919921875, 0.3411865234375, 0.47369384765625, 0.606201171875, 0.73870849609375, 0.8712158203125, 1.00372314453125, 1.13623046875, 1.26873779296875, 1.4012451171875, 1.53375244140625, 1.666259765625, 1.79876708984375, 1.9312744140625, 2.06378173828125, 2.1962890625, 2.32879638671875, 2.4613037109375, 2.59381103515625, 2.726318359375, 2.85882568359375, 2.9913330078125, 3.12384033203125, 3.25634765625, 3.38885498046875, 3.5213623046875, 3.65386962890625, 3.786376953125, 3.91888427734375, 4.0513916015625, 4.18389892578125, 4.31640625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 6.0, 6.0, 20.0, 18.0, 28.0, 35.0, 75.0, 111.0, 142.0, 192.0, 304.0, 374.0, 552.0, 822.0, 1129.0, 1591.0, 2174.0, 3037.0, 4247.0, 5870.0, 8328.0, 11657.0, 16433.0, 22950.0, 32903.0, 46501.0, 67251.0, 98673.0, 143971.0, 1216559.0, 126525.0, 86144.0, 58743.0, 40545.0, 28828.0, 20181.0, 14312.0, 10166.0, 7416.0, 5186.0, 3760.0, 2686.0, 1893.0, 1375.0, 994.0, 678.0, 503.0, 376.0, 269.0, 170.0, 143.0, 96.0, 73.0, 42.0, 31.0, 16.0, 8.0, 13.0, 8.0, 3.0, 5.0], "bins": [-0.0596923828125, -0.0578455924987793, -0.055998802185058594, -0.05415201187133789, -0.05230522155761719, -0.050458431243896484, -0.04861164093017578, -0.04676485061645508, -0.044918060302734375, -0.04307126998901367, -0.04122447967529297, -0.039377689361572266, -0.03753089904785156, -0.03568410873413086, -0.033837318420410156, -0.03199052810668945, -0.03014373779296875, -0.028296947479248047, -0.026450157165527344, -0.02460336685180664, -0.022756576538085938, -0.020909786224365234, -0.01906299591064453, -0.017216205596923828, -0.015369415283203125, -0.013522624969482422, -0.011675834655761719, -0.009829044342041016, -0.007982254028320312, -0.006135463714599609, -0.004288673400878906, -0.002441883087158203, -0.0005950927734375, 0.0012516975402832031, 0.0030984878540039062, 0.004945278167724609, 0.0067920684814453125, 0.008638858795166016, 0.010485649108886719, 0.012332439422607422, 0.014179229736328125, 0.016026020050048828, 0.01787281036376953, 0.019719600677490234, 0.021566390991210938, 0.02341318130493164, 0.025259971618652344, 0.027106761932373047, 0.02895355224609375, 0.030800342559814453, 0.032647132873535156, 0.03449392318725586, 0.03634071350097656, 0.038187503814697266, 0.04003429412841797, 0.04188108444213867, 0.043727874755859375, 0.04557466506958008, 0.04742145538330078, 0.049268245697021484, 0.05111503601074219, 0.05296182632446289, 0.054808616638183594, 0.0566554069519043, 0.058502197265625]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 7.0, 6.0, 17.0, 28.0, 19.0, 28.0, 36.0, 53.0, 43.0, 69.0, 72.0, 76.0, 70.0, 77.0, 80.0, 51.0, 64.0, 52.0, 32.0, 28.0, 29.0, 14.0, 10.0, 14.0, 6.0, 6.0, 4.0, 1.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00027441978454589844, -0.00026644766330718994, -0.00025847554206848145, -0.00025050342082977295, -0.00024253129959106445, -0.00023455917835235596, -0.00022658705711364746, -0.00021861493587493896, -0.00021064281463623047, -0.00020267069339752197, -0.00019469857215881348, -0.00018672645092010498, -0.00017875432968139648, -0.000170782208442688, -0.0001628100872039795, -0.000154837965965271, -0.0001468658447265625, -0.000138893723487854, -0.0001309216022491455, -0.000122949481010437, -0.00011497735977172852, -0.00010700523853302002, -9.903311729431152e-05, -9.106099605560303e-05, -8.308887481689453e-05, -7.511675357818604e-05, -6.714463233947754e-05, -5.917251110076904e-05, -5.120038986206055e-05, -4.322826862335205e-05, -3.5256147384643555e-05, -2.728402614593506e-05, -1.9311904907226562e-05, -1.1339783668518066e-05, -3.3676624298095703e-06, 4.604458808898926e-06, 1.2576580047607422e-05, 2.0548701286315918e-05, 2.8520822525024414e-05, 3.649294376373291e-05, 4.4465065002441406e-05, 5.24371862411499e-05, 6.04093074798584e-05, 6.83814287185669e-05, 7.635354995727539e-05, 8.432567119598389e-05, 9.229779243469238e-05, 0.00010026991367340088, 0.00010824203491210938, 0.00011621415615081787, 0.00012418627738952637, 0.00013215839862823486, 0.00014013051986694336, 0.00014810264110565186, 0.00015607476234436035, 0.00016404688358306885, 0.00017201900482177734, 0.00017999112606048584, 0.00018796324729919434, 0.00019593536853790283, 0.00020390748977661133, 0.00021187961101531982, 0.00021985173225402832, 0.00022782385349273682, 0.0002357959747314453]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 7.0, 6.0, 4.0, 12.0, 19.0, 24.0, 33.0, 58.0, 70.0, 107.0, 131.0, 186.0, 252.0, 302.0, 746.0, 13932.0, 1024165.0, 6674.0, 629.0, 304.0, 258.0, 159.0, 126.0, 104.0, 69.0, 51.0, 41.0, 26.0, 17.0, 10.0, 11.0, 11.0, 1.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003814697265625, -0.0036893486976623535, -0.003564000129699707, -0.0034386515617370605, -0.003313302993774414, -0.0031879544258117676, -0.003062605857849121, -0.0029372572898864746, -0.002811908721923828, -0.0026865601539611816, -0.002561211585998535, -0.0024358630180358887, -0.002310514450073242, -0.0021851658821105957, -0.0020598173141479492, -0.0019344687461853027, -0.0018091201782226562, -0.0016837716102600098, -0.0015584230422973633, -0.0014330744743347168, -0.0013077259063720703, -0.0011823773384094238, -0.0010570287704467773, -0.0009316802024841309, -0.0008063316345214844, -0.0006809830665588379, -0.0005556344985961914, -0.0004302859306335449, -0.00030493736267089844, -0.00017958879470825195, -5.424022674560547e-05, 7.110834121704102e-05, 0.0001964569091796875, 0.000321805477142334, 0.00044715404510498047, 0.000572502613067627, 0.0006978511810302734, 0.0008231997489929199, 0.0009485483169555664, 0.0010738968849182129, 0.0011992454528808594, 0.0013245940208435059, 0.0014499425888061523, 0.0015752911567687988, 0.0017006397247314453, 0.0018259882926940918, 0.0019513368606567383, 0.0020766854286193848, 0.0022020339965820312, 0.0023273825645446777, 0.0024527311325073242, 0.0025780797004699707, 0.002703428268432617, 0.0028287768363952637, 0.00295412540435791, 0.0030794739723205566, 0.003204822540283203, 0.0033301711082458496, 0.003455519676208496, 0.0035808682441711426, 0.003706216812133789, 0.0038315653800964355, 0.003956913948059082, 0.0040822625160217285, 0.004207611083984375]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 19.0, 592.0, 376.0, 27.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009625245584174991, -0.0009280359954573214, -0.0008935473742894828, -0.0008590588113293052, -0.0008245701901614666, -0.0007900816272012889, -0.0007555930642411113, -0.0007211044430732727, -0.000686615880113095, -0.0006521273171529174, -0.0006176386959850788, -0.0005831501330249012, -0.0005486615700647235, -0.0005141729488968849, -0.00047968438593670726, -0.00044519579387269914, -0.000410707201808691, -0.0003762186097446829, -0.0003417300176806748, -0.00030724145472049713, -0.000272752862656489, -0.0002382642705924809, -0.000203775693080388, -0.00016928711556829512, -0.000134798523504287, -0.0001003099387162365, -6.5821353928186e-05, -3.13327691401355e-05, 3.1558156479150057e-06, 3.764440771192312e-05, 7.213298522401601e-05, 0.0001066215627361089, 0.0001411100383847952, 0.0001755986304488033, 0.0002100872079608962, 0.0002445757854729891, 0.0002790643775369972, 0.0003135529696010053, 0.000348041532561183, 0.0003825301246251911, 0.0004170187166891992, 0.0004515073087532073, 0.00048599590081721544, 0.0005204844637773931, 0.0005549730267375708, 0.0005894616479054093, 0.000623950210865587, 0.0006584387738257647, 0.0006929273949936032, 0.0007274159579537809, 0.0007619045791216195, 0.0007963931420817971, 0.0008308817632496357, 0.0008653703262098134, 0.000899858889169991, 0.0009343475103378296, 0.0009688360732980072, 0.001003324636258185, 0.0010378132574260235, 0.001072301878593862, 0.0011067903833463788, 0.0011412790045142174, 0.001175767625682056, 0.0012102561304345727, 0.0012447447516024113]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 9.0, 6.0, 2.0, 12.0, 11.0, 15.0, 15.0, 18.0, 19.0, 25.0, 25.0, 25.0, 25.0, 29.0, 27.0, 49.0, 38.0, 32.0, 29.0, 32.0, 49.0, 33.0, 44.0, 29.0, 36.0, 32.0, 36.0, 25.0, 36.0, 30.0, 31.0, 20.0, 25.0, 21.0, 17.0, 21.0, 10.0, 14.0, 7.0, 5.0, 6.0, 6.0, 4.0, 5.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.0001232624053955078, -0.00011950545012950897, -0.00011574849486351013, -0.00011199153959751129, -0.00010823458433151245, -0.00010447762906551361, -0.00010072067379951477, -9.696371853351593e-05, -9.320676326751709e-05, -8.944980800151825e-05, -8.569285273551941e-05, -8.193589746952057e-05, -7.817894220352173e-05, -7.442198693752289e-05, -7.066503167152405e-05, -6.690807640552521e-05, -6.315112113952637e-05, -5.939416587352753e-05, -5.5637210607528687e-05, -5.1880255341529846e-05, -4.8123300075531006e-05, -4.4366344809532166e-05, -4.0609389543533325e-05, -3.6852434277534485e-05, -3.3095479011535645e-05, -2.9338523745536804e-05, -2.5581568479537964e-05, -2.1824613213539124e-05, -1.8067657947540283e-05, -1.4310702681541443e-05, -1.0553747415542603e-05, -6.796792149543762e-06, -3.039836883544922e-06, 7.171183824539185e-07, 4.474073648452759e-06, 8.231028914451599e-06, 1.198798418045044e-05, 1.574493944644928e-05, 1.950189471244812e-05, 2.325884997844696e-05, 2.70158052444458e-05, 3.077276051044464e-05, 3.452971577644348e-05, 3.828667104244232e-05, 4.204362630844116e-05, 4.580058157444e-05, 4.955753684043884e-05, 5.331449210643768e-05, 5.7071447372436523e-05, 6.0828402638435364e-05, 6.45853579044342e-05, 6.834231317043304e-05, 7.209926843643188e-05, 7.585622370243073e-05, 7.961317896842957e-05, 8.33701342344284e-05, 8.712708950042725e-05, 9.088404476642609e-05, 9.464100003242493e-05, 9.839795529842377e-05, 0.00010215491056442261, 0.00010591186583042145, 0.00010966882109642029, 0.00011342577636241913, 0.00011718273162841797]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 3.0, 2.0, 4.0, 6.0, 10.0, 11.0, 6.0, 14.0, 14.0, 12.0, 16.0, 26.0, 34.0, 21.0, 30.0, 45.0, 49.0, 44.0, 65.0, 53.0, 69.0, 48.0, 54.0, 55.0, 35.0, 41.0, 33.0, 39.0, 25.0, 18.0, 15.0, 18.0, 18.0, 9.0, 14.0, 10.0, 8.0, 4.0, 4.0, 2.0, 7.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.0859375, -8.8060302734375, -8.526123046875, -8.2462158203125, -7.96630859375, -7.6864013671875, -7.406494140625, -7.1265869140625, -6.8466796875, -6.5667724609375, -6.286865234375, -6.0069580078125, -5.72705078125, -5.4471435546875, -5.167236328125, -4.8873291015625, -4.607421875, -4.3275146484375, -4.047607421875, -3.7677001953125, -3.48779296875, -3.2078857421875, -2.927978515625, -2.6480712890625, -2.3681640625, -2.0882568359375, -1.808349609375, -1.5284423828125, -1.24853515625, -0.9686279296875, -0.688720703125, -0.4088134765625, -0.12890625, 0.1510009765625, 0.430908203125, 0.7108154296875, 0.99072265625, 1.2706298828125, 1.550537109375, 1.8304443359375, 2.1103515625, 2.3902587890625, 2.670166015625, 2.9500732421875, 3.22998046875, 3.5098876953125, 3.789794921875, 4.0697021484375, 4.349609375, 4.6295166015625, 4.909423828125, 5.1893310546875, 5.46923828125, 5.7491455078125, 6.029052734375, 6.3089599609375, 6.5888671875, 6.8687744140625, 7.148681640625, 7.4285888671875, 7.70849609375, 7.9884033203125, 8.268310546875, 8.5482177734375, 8.828125]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 4.0, 3.0, 6.0, 10.0, 18.0, 20.0, 25.0, 26.0, 45.0, 52.0, 88.0, 93.0, 125.0, 162.0, 255.0, 360.0, 546.0, 820.0, 1244.0, 2252.0, 4049.0, 7867.0, 20317.0, 133324.0, 795785.0, 52976.0, 13671.0, 6022.0, 3120.0, 1843.0, 1136.0, 685.0, 457.0, 285.0, 215.0, 150.0, 125.0, 89.0, 75.0, 53.0, 43.0, 25.0, 21.0, 14.0, 13.0, 16.0, 11.0, 8.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.0625, -14.6103515625, -14.158203125, -13.7060546875, -13.25390625, -12.8017578125, -12.349609375, -11.8974609375, -11.4453125, -10.9931640625, -10.541015625, -10.0888671875, -9.63671875, -9.1845703125, -8.732421875, -8.2802734375, -7.828125, -7.3759765625, -6.923828125, -6.4716796875, -6.01953125, -5.5673828125, -5.115234375, -4.6630859375, -4.2109375, -3.7587890625, -3.306640625, -2.8544921875, -2.40234375, -1.9501953125, -1.498046875, -1.0458984375, -0.59375, -0.1416015625, 0.310546875, 0.7626953125, 1.21484375, 1.6669921875, 2.119140625, 2.5712890625, 3.0234375, 3.4755859375, 3.927734375, 4.3798828125, 4.83203125, 5.2841796875, 5.736328125, 6.1884765625, 6.640625, 7.0927734375, 7.544921875, 7.9970703125, 8.44921875, 8.9013671875, 9.353515625, 9.8056640625, 10.2578125, 10.7099609375, 11.162109375, 11.6142578125, 12.06640625, 12.5185546875, 12.970703125, 13.4228515625, 13.875]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 5.0, 6.0, 5.0, 5.0, 5.0, 8.0, 10.0, 18.0, 17.0, 19.0, 25.0, 20.0, 26.0, 44.0, 41.0, 44.0, 49.0, 56.0, 57.0, 109.0, 1715.0, 260.0, 87.0, 60.0, 43.0, 49.0, 40.0, 31.0, 24.0, 32.0, 28.0, 24.0, 17.0, 12.0, 14.0, 4.0, 8.0, 9.0, 6.0, 4.0, 5.0, 3.0, 4.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-33.1875, -32.234375, -31.28125, -30.328125, -29.375, -28.421875, -27.46875, -26.515625, -25.5625, -24.609375, -23.65625, -22.703125, -21.75, -20.796875, -19.84375, -18.890625, -17.9375, -16.984375, -16.03125, -15.078125, -14.125, -13.171875, -12.21875, -11.265625, -10.3125, -9.359375, -8.40625, -7.453125, -6.5, -5.546875, -4.59375, -3.640625, -2.6875, -1.734375, -0.78125, 0.171875, 1.125, 2.078125, 3.03125, 3.984375, 4.9375, 5.890625, 6.84375, 7.796875, 8.75, 9.703125, 10.65625, 11.609375, 12.5625, 13.515625, 14.46875, 15.421875, 16.375, 17.328125, 18.28125, 19.234375, 20.1875, 21.140625, 22.09375, 23.046875, 24.0, 24.953125, 25.90625, 26.859375, 27.8125]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 1.0, 6.0, 5.0, 9.0, 7.0, 4.0, 13.0, 15.0, 21.0, 27.0, 37.0, 47.0, 65.0, 80.0, 126.0, 286.0, 601.0, 1521.0, 6901.0, 88240.0, 3002830.0, 38095.0, 4433.0, 1152.0, 473.0, 257.0, 134.0, 82.0, 52.0, 41.0, 31.0, 24.0, 23.0, 13.0, 14.0, 12.0, 5.0, 3.0, 6.0, 5.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-40.78125, -39.39306640625, -38.0048828125, -36.61669921875, -35.228515625, -33.84033203125, -32.4521484375, -31.06396484375, -29.67578125, -28.28759765625, -26.8994140625, -25.51123046875, -24.123046875, -22.73486328125, -21.3466796875, -19.95849609375, -18.5703125, -17.18212890625, -15.7939453125, -14.40576171875, -13.017578125, -11.62939453125, -10.2412109375, -8.85302734375, -7.46484375, -6.07666015625, -4.6884765625, -3.30029296875, -1.912109375, -0.52392578125, 0.8642578125, 2.25244140625, 3.640625, 5.02880859375, 6.4169921875, 7.80517578125, 9.193359375, 10.58154296875, 11.9697265625, 13.35791015625, 14.74609375, 16.13427734375, 17.5224609375, 18.91064453125, 20.298828125, 21.68701171875, 23.0751953125, 24.46337890625, 25.8515625, 27.23974609375, 28.6279296875, 30.01611328125, 31.404296875, 32.79248046875, 34.1806640625, 35.56884765625, 36.95703125, 38.34521484375, 39.7333984375, 41.12158203125, 42.509765625, 43.89794921875, 45.2861328125, 46.67431640625, 48.0625]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [8.0, 784.0, 221.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.034774780273438, -11.262662887573242, 2.509449005126953, 16.28156280517578, 30.053672790527344, 43.825782775878906, 57.597900390625, 71.37001037597656, 85.14212036132812, 98.91423034667969, 112.68634033203125, 126.45845794677734, 140.23056030273438, 154.002685546875, 167.77479553222656, 181.54690551757812, 195.3190155029297, 209.09112548828125, 222.8632354736328, 236.63534545898438, 250.407470703125, 264.1795654296875, 277.9516906738281, 291.72381591796875, 305.49591064453125, 319.2680358886719, 333.0401306152344, 346.812255859375, 360.5843505859375, 374.3564758300781, 388.12860107421875, 401.90069580078125, 415.67279052734375, 429.4449157714844, 443.2170104980469, 456.9891357421875, 470.76123046875, 484.5333557128906, 498.30548095703125, 512.0775756835938, 525.8496704101562, 539.6217651367188, 553.3939208984375, 567.166015625, 580.9381103515625, 594.710205078125, 608.4823608398438, 622.2544555664062, 636.026611328125, 649.7987060546875, 663.5708618164062, 677.3429565429688, 691.1150512695312, 704.8871459960938, 718.6593017578125, 732.431396484375, 746.2034912109375, 759.9755859375, 773.7477416992188, 787.5198364257812, 801.2919311523438, 815.0640258789062, 828.836181640625, 842.6082763671875, 856.38037109375]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 2.0, 6.0, 4.0, 4.0, 5.0, 6.0, 9.0, 9.0, 15.0, 12.0, 12.0, 24.0, 22.0, 30.0, 33.0, 32.0, 26.0, 34.0, 32.0, 40.0, 35.0, 44.0, 59.0, 43.0, 38.0, 39.0, 48.0, 44.0, 36.0, 35.0, 28.0, 34.0, 27.0, 20.0, 24.0, 15.0, 11.0, 12.0, 18.0, 8.0, 7.0, 3.0, 5.0, 7.0, 0.0, 6.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0], "bins": [-100.16007232666016, -97.13978576660156, -94.11949920654297, -91.0992202758789, -88.07893371582031, -85.05864715576172, -82.03836059570312, -79.01808166503906, -75.99779510498047, -72.97750854492188, -69.95722198486328, -66.93694305419922, -63.916656494140625, -60.89636993408203, -57.87608337402344, -54.85580062866211, -51.835514068603516, -48.81522750854492, -45.794944763183594, -42.774658203125, -39.75437545776367, -36.73408889770508, -33.71380615234375, -30.693519592285156, -27.673234939575195, -24.652950286865234, -21.632665634155273, -18.612380981445312, -15.592095375061035, -12.571810722351074, -9.551525115966797, -6.531240463256836, -3.510955810546875, -0.49067091941833496, 2.529613971710205, 5.549899101257324, 8.570183753967285, 11.590468406677246, 14.610754013061523, 17.631038665771484, 20.651323318481445, 23.671607971191406, 26.691892623901367, 29.712177276611328, 32.73246383666992, 35.75274658203125, 38.773033142089844, 41.79331970214844, 44.813602447509766, 47.83388900756836, 50.85417175292969, 53.87445831298828, 56.89474105834961, 59.9150276184082, 62.93531036376953, 65.95559692382812, 68.97588348388672, 71.99617004394531, 75.0164566040039, 78.03673553466797, 81.05702209472656, 84.07730865478516, 87.09759521484375, 90.11787414550781, 93.1381607055664]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 5.0, 2.0, 3.0, 10.0, 9.0, 12.0, 13.0, 7.0, 15.0, 17.0, 27.0, 24.0, 31.0, 33.0, 44.0, 39.0, 53.0, 52.0, 51.0, 69.0, 60.0, 53.0, 50.0, 46.0, 39.0, 36.0, 28.0, 31.0, 17.0, 21.0, 14.0, 15.0, 14.0, 18.0, 10.0, 9.0, 1.0, 5.0, 3.0, 5.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.2734375, -8.989501953125, -8.70556640625, -8.421630859375, -8.1376953125, -7.853759765625, -7.56982421875, -7.285888671875, -7.001953125, -6.718017578125, -6.43408203125, -6.150146484375, -5.8662109375, -5.582275390625, -5.29833984375, -5.014404296875, -4.73046875, -4.446533203125, -4.16259765625, -3.878662109375, -3.5947265625, -3.310791015625, -3.02685546875, -2.742919921875, -2.458984375, -2.175048828125, -1.89111328125, -1.607177734375, -1.3232421875, -1.039306640625, -0.75537109375, -0.471435546875, -0.1875, 0.096435546875, 0.38037109375, 0.664306640625, 0.9482421875, 1.232177734375, 1.51611328125, 1.800048828125, 2.083984375, 2.367919921875, 2.65185546875, 2.935791015625, 3.2197265625, 3.503662109375, 3.78759765625, 4.071533203125, 4.35546875, 4.639404296875, 4.92333984375, 5.207275390625, 5.4912109375, 5.775146484375, 6.05908203125, 6.343017578125, 6.626953125, 6.910888671875, 7.19482421875, 7.478759765625, 7.7626953125, 8.046630859375, 8.33056640625, 8.614501953125, 8.8984375]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 7.0, 7.0, 8.0, 14.0, 19.0, 21.0, 36.0, 49.0, 52.0, 123.0, 181.0, 282.0, 443.0, 717.0, 1189.0, 2148.0, 3988.0, 8250.0, 21876.0, 359691.0, 3592159.0, 170352.0, 17483.0, 7069.0, 3536.0, 1893.0, 1037.0, 646.0, 406.0, 192.0, 139.0, 80.0, 72.0, 30.0, 32.0, 21.0, 12.0, 5.0, 5.0, 2.0, 1.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.71875, -33.67919921875, -32.6396484375, -31.60009765625, -30.560546875, -29.52099609375, -28.4814453125, -27.44189453125, -26.40234375, -25.36279296875, -24.3232421875, -23.28369140625, -22.244140625, -21.20458984375, -20.1650390625, -19.12548828125, -18.0859375, -17.04638671875, -16.0068359375, -14.96728515625, -13.927734375, -12.88818359375, -11.8486328125, -10.80908203125, -9.76953125, -8.72998046875, -7.6904296875, -6.65087890625, -5.611328125, -4.57177734375, -3.5322265625, -2.49267578125, -1.453125, -0.41357421875, 0.6259765625, 1.66552734375, 2.705078125, 3.74462890625, 4.7841796875, 5.82373046875, 6.86328125, 7.90283203125, 8.9423828125, 9.98193359375, 11.021484375, 12.06103515625, 13.1005859375, 14.14013671875, 15.1796875, 16.21923828125, 17.2587890625, 18.29833984375, 19.337890625, 20.37744140625, 21.4169921875, 22.45654296875, 23.49609375, 24.53564453125, 25.5751953125, 26.61474609375, 27.654296875, 28.69384765625, 29.7333984375, 30.77294921875, 31.8125]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 5.0, 7.0, 8.0, 8.0, 5.0, 4.0, 10.0, 18.0, 13.0, 20.0, 25.0, 41.0, 39.0, 50.0, 99.0, 193.0, 373.0, 714.0, 961.0, 674.0, 317.0, 164.0, 71.0, 58.0, 27.0, 40.0, 24.0, 15.0, 26.0, 7.0, 11.0, 10.0, 6.0, 4.0, 6.0, 4.0, 2.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-25.296875, -24.516357421875, -23.73583984375, -22.955322265625, -22.1748046875, -21.394287109375, -20.61376953125, -19.833251953125, -19.052734375, -18.272216796875, -17.49169921875, -16.711181640625, -15.9306640625, -15.150146484375, -14.36962890625, -13.589111328125, -12.80859375, -12.028076171875, -11.24755859375, -10.467041015625, -9.6865234375, -8.906005859375, -8.12548828125, -7.344970703125, -6.564453125, -5.783935546875, -5.00341796875, -4.222900390625, -3.4423828125, -2.661865234375, -1.88134765625, -1.100830078125, -0.3203125, 0.460205078125, 1.24072265625, 2.021240234375, 2.8017578125, 3.582275390625, 4.36279296875, 5.143310546875, 5.923828125, 6.704345703125, 7.48486328125, 8.265380859375, 9.0458984375, 9.826416015625, 10.60693359375, 11.387451171875, 12.16796875, 12.948486328125, 13.72900390625, 14.509521484375, 15.2900390625, 16.070556640625, 16.85107421875, 17.631591796875, 18.412109375, 19.192626953125, 19.97314453125, 20.753662109375, 21.5341796875, 22.314697265625, 23.09521484375, 23.875732421875, 24.65625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 6.0, 7.0, 6.0, 12.0, 15.0, 21.0, 24.0, 37.0, 55.0, 80.0, 112.0, 170.0, 239.0, 394.0, 579.0, 991.0, 1620.0, 2848.0, 5362.0, 10841.0, 24947.0, 76530.0, 751621.0, 3064432.0, 179383.0, 40918.0, 16001.0, 7619.0, 3890.0, 2113.0, 1257.0, 781.0, 501.0, 303.0, 168.0, 99.0, 63.0, 62.0, 46.0, 36.0, 27.0, 21.0, 12.0, 9.0, 5.0, 6.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-30.6875, -29.73583984375, -28.7841796875, -27.83251953125, -26.880859375, -25.92919921875, -24.9775390625, -24.02587890625, -23.07421875, -22.12255859375, -21.1708984375, -20.21923828125, -19.267578125, -18.31591796875, -17.3642578125, -16.41259765625, -15.4609375, -14.50927734375, -13.5576171875, -12.60595703125, -11.654296875, -10.70263671875, -9.7509765625, -8.79931640625, -7.84765625, -6.89599609375, -5.9443359375, -4.99267578125, -4.041015625, -3.08935546875, -2.1376953125, -1.18603515625, -0.234375, 0.71728515625, 1.6689453125, 2.62060546875, 3.572265625, 4.52392578125, 5.4755859375, 6.42724609375, 7.37890625, 8.33056640625, 9.2822265625, 10.23388671875, 11.185546875, 12.13720703125, 13.0888671875, 14.04052734375, 14.9921875, 15.94384765625, 16.8955078125, 17.84716796875, 18.798828125, 19.75048828125, 20.7021484375, 21.65380859375, 22.60546875, 23.55712890625, 24.5087890625, 25.46044921875, 26.412109375, 27.36376953125, 28.3154296875, 29.26708984375, 30.21875]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 5.0, 4.0, 10.0, 12.0, 26.0, 34.0, 68.0, 128.0, 190.0, 204.0, 133.0, 68.0, 56.0, 25.0, 17.0, 15.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.36418151855469, -74.26775360107422, -70.17131805419922, -66.07489013671875, -61.978458404541016, -57.88202667236328, -53.78559875488281, -49.68916702270508, -45.592735290527344, -41.49630355834961, -37.399871826171875, -33.303443908691406, -29.207012176513672, -25.110580444335938, -21.014150619506836, -16.917720794677734, -12.8212890625, -8.724858283996582, -4.628427505493164, -0.5319967269897461, 3.564434051513672, 7.660865783691406, 11.757295608520508, 15.85372543334961, 19.950157165527344, 24.046588897705078, 28.14301872253418, 32.23944854736328, 36.335880279541016, 40.43231201171875, 44.52873992919922, 48.62517166137695, 52.72160339355469, 56.81803512573242, 60.914466857910156, 65.01089477539062, 69.10733032226562, 73.2037582397461, 77.30018615722656, 81.39662170410156, 85.49304962158203, 89.5894775390625, 93.6859130859375, 97.78234100341797, 101.87876892089844, 105.97520446777344, 110.0716323852539, 114.16806030273438, 118.26449584960938, 122.36092376708984, 126.45735931396484, 130.5537872314453, 134.6502227783203, 138.74664306640625, 142.84307861328125, 146.93951416015625, 151.03594970703125, 155.13238525390625, 159.2288055419922, 163.3252410888672, 167.4216766357422, 171.51809692382812, 175.61453247070312, 179.71096801757812, 183.80738830566406]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 0.0, 2.0, 3.0, 6.0, 1.0, 9.0, 5.0, 8.0, 13.0, 10.0, 15.0, 13.0, 19.0, 22.0, 21.0, 24.0, 28.0, 51.0, 38.0, 32.0, 39.0, 43.0, 54.0, 48.0, 43.0, 44.0, 51.0, 49.0, 33.0, 28.0, 35.0, 32.0, 24.0, 23.0, 20.0, 17.0, 25.0, 20.0, 17.0, 9.0, 8.0, 8.0, 7.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.7494125366211, -75.25308990478516, -72.75676727294922, -70.26044464111328, -67.76412200927734, -65.2677993774414, -62.771480560302734, -60.2751579284668, -57.77883529663086, -55.28251266479492, -52.786190032958984, -50.28986740112305, -47.793548583984375, -45.29722595214844, -42.8009033203125, -40.30458068847656, -37.808258056640625, -35.31193542480469, -32.81561279296875, -30.319292068481445, -27.822969436645508, -25.32664680480957, -22.830326080322266, -20.334003448486328, -17.83768081665039, -15.341358184814453, -12.845036506652832, -10.348714828491211, -7.852392196655273, -5.356069564819336, -2.859747886657715, -0.36342620849609375, 2.132904052734375, 4.629226207733154, 7.125548362731934, 9.621870040893555, 12.118192672729492, 14.61451530456543, 17.110836029052734, 19.607158660888672, 22.10348129272461, 24.599803924560547, 27.096126556396484, 29.59244728088379, 32.088768005371094, 34.58509063720703, 37.08141326904297, 39.577735900878906, 42.074058532714844, 44.57038116455078, 47.06670379638672, 49.563026428222656, 52.059349060058594, 54.55567169189453, 57.0519905090332, 59.54831314086914, 62.04463577270508, 64.54095458984375, 67.03727722167969, 69.53359985351562, 72.02992248535156, 74.5262451171875, 77.02256774902344, 79.51889038085938, 82.01521301269531]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 3.0, 5.0, 3.0, 9.0, 15.0, 6.0, 14.0, 16.0, 18.0, 25.0, 24.0, 33.0, 39.0, 29.0, 44.0, 60.0, 36.0, 54.0, 54.0, 59.0, 49.0, 46.0, 44.0, 56.0, 33.0, 32.0, 29.0, 24.0, 29.0, 12.0, 19.0, 11.0, 15.0, 9.0, 13.0, 5.0, 4.0, 5.0, 7.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.09375, -8.8184814453125, -8.543212890625, -8.2679443359375, -7.99267578125, -7.7174072265625, -7.442138671875, -7.1668701171875, -6.8916015625, -6.6163330078125, -6.341064453125, -6.0657958984375, -5.79052734375, -5.5152587890625, -5.239990234375, -4.9647216796875, -4.689453125, -4.4141845703125, -4.138916015625, -3.8636474609375, -3.58837890625, -3.3131103515625, -3.037841796875, -2.7625732421875, -2.4873046875, -2.2120361328125, -1.936767578125, -1.6614990234375, -1.38623046875, -1.1109619140625, -0.835693359375, -0.5604248046875, -0.28515625, -0.0098876953125, 0.265380859375, 0.5406494140625, 0.81591796875, 1.0911865234375, 1.366455078125, 1.6417236328125, 1.9169921875, 2.1922607421875, 2.467529296875, 2.7427978515625, 3.01806640625, 3.2933349609375, 3.568603515625, 3.8438720703125, 4.119140625, 4.3944091796875, 4.669677734375, 4.9449462890625, 5.22021484375, 5.4954833984375, 5.770751953125, 6.0460205078125, 6.3212890625, 6.5965576171875, 6.871826171875, 7.1470947265625, 7.42236328125, 7.6976318359375, 7.972900390625, 8.2481689453125, 8.5234375]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 8.0, 6.0, 12.0, 22.0, 20.0, 42.0, 56.0, 89.0, 119.0, 148.0, 227.0, 332.0, 483.0, 707.0, 1091.0, 1575.0, 2533.0, 3892.0, 6016.0, 9637.0, 15729.0, 25848.0, 43997.0, 76285.0, 139091.0, 253598.0, 204781.0, 108949.0, 60888.0, 35645.0, 21217.0, 12990.0, 7984.0, 4994.0, 3230.0, 2090.0, 1364.0, 880.0, 654.0, 417.0, 278.0, 171.0, 150.0, 94.0, 78.0, 54.0, 25.0, 16.0, 15.0, 9.0, 9.0, 7.0, 3.0, 3.0, 4.0, 3.0, 2.0, 2.0], "bins": [-0.1756591796875, -0.170135498046875, -0.16461181640625, -0.159088134765625, -0.153564453125, -0.148040771484375, -0.14251708984375, -0.136993408203125, -0.1314697265625, -0.125946044921875, -0.12042236328125, -0.114898681640625, -0.109375, -0.103851318359375, -0.09832763671875, -0.092803955078125, -0.0872802734375, -0.081756591796875, -0.07623291015625, -0.070709228515625, -0.065185546875, -0.059661865234375, -0.05413818359375, -0.048614501953125, -0.0430908203125, -0.037567138671875, -0.03204345703125, -0.026519775390625, -0.02099609375, -0.015472412109375, -0.00994873046875, -0.004425048828125, 0.0010986328125, 0.006622314453125, 0.01214599609375, 0.017669677734375, 0.023193359375, 0.028717041015625, 0.03424072265625, 0.039764404296875, 0.0452880859375, 0.050811767578125, 0.05633544921875, 0.061859130859375, 0.0673828125, 0.072906494140625, 0.07843017578125, 0.083953857421875, 0.0894775390625, 0.095001220703125, 0.10052490234375, 0.106048583984375, 0.111572265625, 0.117095947265625, 0.12261962890625, 0.128143310546875, 0.1336669921875, 0.139190673828125, 0.14471435546875, 0.150238037109375, 0.15576171875, 0.161285400390625, 0.16680908203125, 0.172332763671875, 0.1778564453125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 7.0, 4.0, 7.0, 9.0, 12.0, 8.0, 9.0, 10.0, 20.0, 25.0, 23.0, 17.0, 20.0, 21.0, 42.0, 33.0, 36.0, 28.0, 23.0, 36.0, 44.0, 45.0, 1068.0, 40.0, 38.0, 45.0, 36.0, 34.0, 37.0, 30.0, 26.0, 25.0, 22.0, 20.0, 15.0, 17.0, 14.0, 15.0, 9.0, 10.0, 10.0, 12.0, 7.0, 3.0, 5.0, 4.0, 2.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-3.966796875, -3.832489013671875, -3.69818115234375, -3.563873291015625, -3.4295654296875, -3.295257568359375, -3.16094970703125, -3.026641845703125, -2.892333984375, -2.758026123046875, -2.62371826171875, -2.489410400390625, -2.3551025390625, -2.220794677734375, -2.08648681640625, -1.952178955078125, -1.81787109375, -1.683563232421875, -1.54925537109375, -1.414947509765625, -1.2806396484375, -1.146331787109375, -1.01202392578125, -0.877716064453125, -0.743408203125, -0.609100341796875, -0.47479248046875, -0.340484619140625, -0.2061767578125, -0.071868896484375, 0.06243896484375, 0.196746826171875, 0.3310546875, 0.465362548828125, 0.59967041015625, 0.733978271484375, 0.8682861328125, 1.002593994140625, 1.13690185546875, 1.271209716796875, 1.405517578125, 1.539825439453125, 1.67413330078125, 1.808441162109375, 1.9427490234375, 2.077056884765625, 2.21136474609375, 2.345672607421875, 2.47998046875, 2.614288330078125, 2.74859619140625, 2.882904052734375, 3.0172119140625, 3.151519775390625, 3.28582763671875, 3.420135498046875, 3.554443359375, 3.688751220703125, 3.82305908203125, 3.957366943359375, 4.0916748046875, 4.225982666015625, 4.36029052734375, 4.494598388671875, 4.62890625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 7.0, 11.0, 21.0, 23.0, 41.0, 50.0, 96.0, 111.0, 176.0, 277.0, 358.0, 588.0, 831.0, 1226.0, 1828.0, 2790.0, 4219.0, 6322.0, 9228.0, 14474.0, 21146.0, 32230.0, 48487.0, 74877.0, 118717.0, 812722.0, 608040.0, 118561.0, 75053.0, 49034.0, 31870.0, 21376.0, 14130.0, 9433.0, 6196.0, 4052.0, 2791.0, 1875.0, 1230.0, 857.0, 595.0, 389.0, 265.0, 173.0, 117.0, 85.0, 53.0, 37.0, 27.0, 14.0, 12.0, 3.0, 7.0, 9.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.06988525390625, -0.06763076782226562, -0.06537628173828125, -0.06312179565429688, -0.0608673095703125, -0.058612823486328125, -0.05635833740234375, -0.054103851318359375, -0.051849365234375, -0.049594879150390625, -0.04734039306640625, -0.045085906982421875, -0.0428314208984375, -0.040576934814453125, -0.03832244873046875, -0.036067962646484375, -0.0338134765625, -0.031558990478515625, -0.02930450439453125, -0.027050018310546875, -0.0247955322265625, -0.022541046142578125, -0.02028656005859375, -0.018032073974609375, -0.015777587890625, -0.013523101806640625, -0.01126861572265625, -0.009014129638671875, -0.0067596435546875, -0.004505157470703125, -0.00225067138671875, 3.814697265625e-06, 0.00225830078125, 0.004512786865234375, 0.00676727294921875, 0.009021759033203125, 0.0112762451171875, 0.013530731201171875, 0.01578521728515625, 0.018039703369140625, 0.020294189453125, 0.022548675537109375, 0.02480316162109375, 0.027057647705078125, 0.0293121337890625, 0.031566619873046875, 0.03382110595703125, 0.036075592041015625, 0.038330078125, 0.040584564208984375, 0.04283905029296875, 0.045093536376953125, 0.0473480224609375, 0.049602508544921875, 0.05185699462890625, 0.054111480712890625, 0.056365966796875, 0.058620452880859375, 0.06087493896484375, 0.06312942504882812, 0.0653839111328125, 0.06763839721679688, 0.06989288330078125, 0.07214736938476562, 0.07440185546875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 3.0, 7.0, 19.0, 17.0, 26.0, 30.0, 39.0, 52.0, 54.0, 88.0, 81.0, 71.0, 65.0, 76.0, 77.0, 77.0, 60.0, 43.0, 26.0, 25.0, 17.0, 17.0, 11.0, 10.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003476142883300781, -0.0003368891775608063, -0.0003261640667915344, -0.0003154389560222626, -0.0003047138452529907, -0.00029398873448371887, -0.000283263623714447, -0.00027253851294517517, -0.0002618134021759033, -0.00025108829140663147, -0.00024036318063735962, -0.00022963806986808777, -0.00021891295909881592, -0.00020818784832954407, -0.00019746273756027222, -0.00018673762679100037, -0.00017601251602172852, -0.00016528740525245667, -0.00015456229448318481, -0.00014383718371391296, -0.0001331120729446411, -0.00012238696217536926, -0.00011166185140609741, -0.00010093674063682556, -9.021162986755371e-05, -7.948651909828186e-05, -6.876140832901001e-05, -5.803629755973816e-05, -4.731118679046631e-05, -3.658607602119446e-05, -2.5860965251922607e-05, -1.5135854482650757e-05, -4.410743713378906e-06, 6.314367055892944e-06, 1.7039477825164795e-05, 2.7764588594436646e-05, 3.8489699363708496e-05, 4.921481013298035e-05, 5.99399209022522e-05, 7.066503167152405e-05, 8.13901424407959e-05, 9.211525321006775e-05, 0.0001028403639793396, 0.00011356547474861145, 0.0001242905855178833, 0.00013501569628715515, 0.000145740807056427, 0.00015646591782569885, 0.0001671910285949707, 0.00017791613936424255, 0.0001886412501335144, 0.00019936636090278625, 0.0002100914716720581, 0.00022081658244132996, 0.0002315416932106018, 0.00024226680397987366, 0.0002529919147491455, 0.00026371702551841736, 0.0002744421362876892, 0.00028516724705696106, 0.0002958923578262329, 0.00030661746859550476, 0.0003173425793647766, 0.00032806769013404846, 0.0003387928009033203]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 9.0, 13.0, 16.0, 19.0, 39.0, 70.0, 80.0, 125.0, 167.0, 250.0, 350.0, 727.0, 9486.0, 1025911.0, 9432.0, 773.0, 338.0, 215.0, 144.0, 126.0, 76.0, 61.0, 39.0, 35.0, 19.0, 7.0, 5.0, 3.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0052642822265625, -0.005097150802612305, -0.004930019378662109, -0.004762887954711914, -0.004595756530761719, -0.0044286251068115234, -0.004261493682861328, -0.004094362258911133, -0.0039272308349609375, -0.003760099411010742, -0.003592967987060547, -0.0034258365631103516, -0.0032587051391601562, -0.003091573715209961, -0.0029244422912597656, -0.0027573108673095703, -0.002590179443359375, -0.0024230480194091797, -0.0022559165954589844, -0.002088785171508789, -0.0019216537475585938, -0.0017545223236083984, -0.0015873908996582031, -0.0014202594757080078, -0.0012531280517578125, -0.0010859966278076172, -0.0009188652038574219, -0.0007517337799072266, -0.0005846023559570312, -0.00041747093200683594, -0.0002503395080566406, -8.320808410644531e-05, 8.392333984375e-05, 0.0002510547637939453, 0.0004181861877441406, 0.0005853176116943359, 0.0007524490356445312, 0.0009195804595947266, 0.0010867118835449219, 0.0012538433074951172, 0.0014209747314453125, 0.0015881061553955078, 0.0017552375793457031, 0.0019223690032958984, 0.0020895004272460938, 0.002256631851196289, 0.0024237632751464844, 0.0025908946990966797, 0.002758026123046875, 0.0029251575469970703, 0.0030922889709472656, 0.003259420394897461, 0.0034265518188476562, 0.0035936832427978516, 0.003760814666748047, 0.003927946090698242, 0.0040950775146484375, 0.004262208938598633, 0.004429340362548828, 0.0045964717864990234, 0.004763603210449219, 0.004930734634399414, 0.005097866058349609, 0.005264997482299805, 0.00543212890625]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 60.0, 900.0, 51.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.003988742362707853, -0.003920490853488445, -0.0038522391114383936, -0.003783987369388342, -0.003715735860168934, -0.003647484118118882, -0.003579232608899474, -0.0035109808668494225, -0.0034427293576300144, -0.0033744776155799627, -0.0033062261063605547, -0.003237974364310503, -0.003169722855091095, -0.0031014711130410433, -0.0030332196038216352, -0.0029649678617715836, -0.0028967163525521755, -0.002828464610502124, -0.002760213101282716, -0.002691961359232664, -0.002623709850013256, -0.0025554581079632044, -0.0024872065987437963, -0.0024189548566937447, -0.002350703114643693, -0.0022824513725936413, -0.0022141998633742332, -0.0021459481213241816, -0.0020776966121047735, -0.002009444870054722, -0.0019411933608353138, -0.001872941618785262, -0.0018046898767352104, -0.0017364382511004806, -0.0016681866254657507, -0.0015999349998310208, -0.001531683374196291, -0.001463431748561561, -0.0013951801229268312, -0.0013269283808767796, -0.0012586768716573715, -0.0011904252460226417, -0.0011221736203879118, -0.001053921994753182, -0.000985670369118452, -0.0009174187434837222, -0.0008491670596413314, -0.0007809154340066016, -0.0007126637501642108, -0.0006444121245294809, -0.0005761604988947511, -0.0005079088732600212, -0.0004396572185214609, -0.00037140559288673103, -0.0003031539381481707, -0.00023490231251344085, -0.00016665071598254144, -9.839908307185397e-05, -3.014745016116649e-05, 3.81041900254786e-05, 0.00010635581566020846, 0.00017460744129493833, 0.00024285909603349864, 0.0003111107216682285, 0.00037936234730295837]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 4.0, 1.0, 6.0, 7.0, 5.0, 5.0, 14.0, 12.0, 18.0, 27.0, 23.0, 20.0, 23.0, 33.0, 45.0, 41.0, 47.0, 43.0, 47.0, 44.0, 50.0, 45.0, 58.0, 44.0, 43.0, 42.0, 38.0, 32.0, 32.0, 25.0, 18.0, 22.0, 21.0, 18.0, 12.0, 10.0, 14.0, 8.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001506805419921875, -0.0001443866640329361, -0.0001380927860736847, -0.0001317989081144333, -0.00012550503015518188, -0.00011921115219593048, -0.00011291727423667908, -0.00010662339627742767, -0.00010032951831817627, -9.403564035892487e-05, -8.774176239967346e-05, -8.144788444042206e-05, -7.515400648117065e-05, -6.886012852191925e-05, -6.256625056266785e-05, -5.627237260341644e-05, -4.997849464416504e-05, -4.3684616684913635e-05, -3.739073872566223e-05, -3.109686076641083e-05, -2.4802982807159424e-05, -1.850910484790802e-05, -1.2215226888656616e-05, -5.921348929405212e-06, 3.725290298461914e-07, 6.666406989097595e-06, 1.2960284948348999e-05, 1.9254162907600403e-05, 2.5548040866851807e-05, 3.184191882610321e-05, 3.8135796785354614e-05, 4.442967474460602e-05, 5.072355270385742e-05, 5.7017430663108826e-05, 6.331130862236023e-05, 6.960518658161163e-05, 7.589906454086304e-05, 8.219294250011444e-05, 8.848682045936584e-05, 9.478069841861725e-05, 0.00010107457637786865, 0.00010736845433712006, 0.00011366233229637146, 0.00011995621025562286, 0.00012625008821487427, 0.00013254396617412567, 0.00013883784413337708, 0.00014513172209262848, 0.00015142560005187988, 0.0001577194780111313, 0.0001640133559703827, 0.0001703072339296341, 0.0001766011118888855, 0.0001828949898481369, 0.0001891888678073883, 0.0001954827457666397, 0.0002017766237258911, 0.00020807050168514252, 0.00021436437964439392, 0.00022065825760364532, 0.00022695213556289673, 0.00023324601352214813, 0.00023953989148139954, 0.00024583376944065094, 0.00025212764739990234]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 3.0, 5.0, 3.0, 9.0, 15.0, 6.0, 14.0, 16.0, 18.0, 25.0, 24.0, 33.0, 39.0, 29.0, 44.0, 60.0, 36.0, 54.0, 54.0, 59.0, 49.0, 46.0, 44.0, 56.0, 33.0, 32.0, 29.0, 24.0, 29.0, 12.0, 19.0, 11.0, 15.0, 9.0, 13.0, 5.0, 4.0, 5.0, 7.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.09375, -8.8184814453125, -8.543212890625, -8.2679443359375, -7.99267578125, -7.7174072265625, -7.442138671875, -7.1668701171875, -6.8916015625, -6.6163330078125, -6.341064453125, -6.0657958984375, -5.79052734375, -5.5152587890625, -5.239990234375, -4.9647216796875, -4.689453125, -4.4141845703125, -4.138916015625, -3.8636474609375, -3.58837890625, -3.3131103515625, -3.037841796875, -2.7625732421875, -2.4873046875, -2.2120361328125, -1.936767578125, -1.6614990234375, -1.38623046875, -1.1109619140625, -0.835693359375, -0.5604248046875, -0.28515625, -0.0098876953125, 0.265380859375, 0.5406494140625, 0.81591796875, 1.0911865234375, 1.366455078125, 1.6417236328125, 1.9169921875, 2.1922607421875, 2.467529296875, 2.7427978515625, 3.01806640625, 3.2933349609375, 3.568603515625, 3.8438720703125, 4.119140625, 4.3944091796875, 4.669677734375, 4.9449462890625, 5.22021484375, 5.4954833984375, 5.770751953125, 6.0460205078125, 6.3212890625, 6.5965576171875, 6.871826171875, 7.1470947265625, 7.42236328125, 7.6976318359375, 7.972900390625, 8.2481689453125, 8.5234375]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 6.0, 5.0, 15.0, 11.0, 22.0, 29.0, 37.0, 62.0, 86.0, 113.0, 164.0, 235.0, 353.0, 473.0, 737.0, 1001.0, 1566.0, 2422.0, 3934.0, 6848.0, 14223.0, 38858.0, 296877.0, 592431.0, 51325.0, 16629.0, 7850.0, 4350.0, 2586.0, 1661.0, 1118.0, 775.0, 544.0, 379.0, 221.0, 199.0, 130.0, 95.0, 50.0, 40.0, 22.0, 21.0, 17.0, 18.0, 7.0, 7.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-17.765625, -17.1943359375, -16.623046875, -16.0517578125, -15.48046875, -14.9091796875, -14.337890625, -13.7666015625, -13.1953125, -12.6240234375, -12.052734375, -11.4814453125, -10.91015625, -10.3388671875, -9.767578125, -9.1962890625, -8.625, -8.0537109375, -7.482421875, -6.9111328125, -6.33984375, -5.7685546875, -5.197265625, -4.6259765625, -4.0546875, -3.4833984375, -2.912109375, -2.3408203125, -1.76953125, -1.1982421875, -0.626953125, -0.0556640625, 0.515625, 1.0869140625, 1.658203125, 2.2294921875, 2.80078125, 3.3720703125, 3.943359375, 4.5146484375, 5.0859375, 5.6572265625, 6.228515625, 6.7998046875, 7.37109375, 7.9423828125, 8.513671875, 9.0849609375, 9.65625, 10.2275390625, 10.798828125, 11.3701171875, 11.94140625, 12.5126953125, 13.083984375, 13.6552734375, 14.2265625, 14.7978515625, 15.369140625, 15.9404296875, 16.51171875, 17.0830078125, 17.654296875, 18.2255859375, 18.796875]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 5.0, 5.0, 7.0, 13.0, 17.0, 17.0, 25.0, 12.0, 19.0, 23.0, 26.0, 34.0, 51.0, 56.0, 60.0, 79.0, 154.0, 1537.0, 315.0, 132.0, 67.0, 57.0, 48.0, 30.0, 21.0, 35.0, 38.0, 16.0, 19.0, 12.0, 19.0, 23.0, 14.0, 16.0, 13.0, 6.0, 13.0, 5.0, 2.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-31.8125, -30.873046875, -29.93359375, -28.994140625, -28.0546875, -27.115234375, -26.17578125, -25.236328125, -24.296875, -23.357421875, -22.41796875, -21.478515625, -20.5390625, -19.599609375, -18.66015625, -17.720703125, -16.78125, -15.841796875, -14.90234375, -13.962890625, -13.0234375, -12.083984375, -11.14453125, -10.205078125, -9.265625, -8.326171875, -7.38671875, -6.447265625, -5.5078125, -4.568359375, -3.62890625, -2.689453125, -1.75, -0.810546875, 0.12890625, 1.068359375, 2.0078125, 2.947265625, 3.88671875, 4.826171875, 5.765625, 6.705078125, 7.64453125, 8.583984375, 9.5234375, 10.462890625, 11.40234375, 12.341796875, 13.28125, 14.220703125, 15.16015625, 16.099609375, 17.0390625, 17.978515625, 18.91796875, 19.857421875, 20.796875, 21.736328125, 22.67578125, 23.615234375, 24.5546875, 25.494140625, 26.43359375, 27.373046875, 28.3125]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 8.0, 6.0, 8.0, 13.0, 10.0, 20.0, 9.0, 26.0, 12.0, 22.0, 39.0, 61.0, 77.0, 106.0, 234.0, 533.0, 1433.0, 5015.0, 25698.0, 2263933.0, 821314.0, 20573.0, 4247.0, 1296.0, 489.0, 201.0, 110.0, 57.0, 32.0, 23.0, 17.0, 20.0, 19.0, 15.0, 6.0, 7.0, 4.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.84375, -40.4462890625, -39.048828125, -37.6513671875, -36.25390625, -34.8564453125, -33.458984375, -32.0615234375, -30.6640625, -29.2666015625, -27.869140625, -26.4716796875, -25.07421875, -23.6767578125, -22.279296875, -20.8818359375, -19.484375, -18.0869140625, -16.689453125, -15.2919921875, -13.89453125, -12.4970703125, -11.099609375, -9.7021484375, -8.3046875, -6.9072265625, -5.509765625, -4.1123046875, -2.71484375, -1.3173828125, 0.080078125, 1.4775390625, 2.875, 4.2724609375, 5.669921875, 7.0673828125, 8.46484375, 9.8623046875, 11.259765625, 12.6572265625, 14.0546875, 15.4521484375, 16.849609375, 18.2470703125, 19.64453125, 21.0419921875, 22.439453125, 23.8369140625, 25.234375, 26.6318359375, 28.029296875, 29.4267578125, 30.82421875, 32.2216796875, 33.619140625, 35.0166015625, 36.4140625, 37.8115234375, 39.208984375, 40.6064453125, 42.00390625, 43.4013671875, 44.798828125, 46.1962890625, 47.59375]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 15.0, 36.0, 52.0, 68.0, 150.0, 181.0, 196.0, 139.0, 68.0, 40.0, 25.0, 10.0, 7.0, 6.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-72.12922668457031, -69.99588012695312, -67.86253356933594, -65.72918701171875, -63.59584426879883, -61.46249771118164, -59.32915115356445, -57.195804595947266, -55.062461853027344, -52.929115295410156, -50.79576873779297, -48.66242218017578, -46.52907943725586, -44.39573287963867, -42.262386322021484, -40.1290397644043, -37.99569320678711, -35.86234664916992, -33.729000091552734, -31.59565544128418, -29.462310791015625, -27.328964233398438, -25.19561767578125, -23.062271118164062, -20.928926467895508, -18.79557991027832, -16.662235260009766, -14.528888702392578, -12.395543098449707, -10.262197494506836, -8.128850936889648, -5.995505332946777, -3.8621597290039062, -1.728813886642456, 0.40453195571899414, 2.5378780364990234, 4.6712236404418945, 6.804569244384766, 8.937915802001953, 11.071261405944824, 13.204607009887695, 15.337952613830566, 17.471298217773438, 19.604644775390625, 21.737991333007812, 23.871335983276367, 26.004682540893555, 28.13802719116211, 30.271373748779297, 32.404720306396484, 34.53806686401367, 36.671409606933594, 38.80475616455078, 40.93810272216797, 43.071449279785156, 45.204795837402344, 47.33814239501953, 49.47148895263672, 51.604835510253906, 53.738182067871094, 55.871524810791016, 58.0048713684082, 60.13821792602539, 62.27156448364258, 64.4049072265625]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 3.0, 6.0, 5.0, 7.0, 7.0, 5.0, 7.0, 12.0, 13.0, 19.0, 17.0, 18.0, 18.0, 21.0, 30.0, 29.0, 28.0, 39.0, 29.0, 51.0, 33.0, 37.0, 29.0, 30.0, 46.0, 42.0, 40.0, 36.0, 28.0, 34.0, 27.0, 45.0, 19.0, 29.0, 24.0, 21.0, 23.0, 17.0, 15.0, 10.0, 9.0, 16.0, 8.0, 5.0, 7.0, 6.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.57829284667969, -83.71070861816406, -80.84313201904297, -77.97555541992188, -75.10797119140625, -72.24038696289062, -69.37281036376953, -66.50523376464844, -63.63764953613281, -60.77006912231445, -57.902488708496094, -55.034908294677734, -52.167327880859375, -49.299747467041016, -46.432167053222656, -43.5645866394043, -40.69700622558594, -37.82942581176758, -34.96184539794922, -32.09426498413086, -29.2266845703125, -26.35910415649414, -23.49152374267578, -20.623943328857422, -17.756362915039062, -14.888782501220703, -12.021202087402344, -9.153621673583984, -6.286041259765625, -3.4184608459472656, -0.5508804321289062, 2.316699981689453, 5.184288024902344, 8.051868438720703, 10.919448852539062, 13.787029266357422, 16.65460968017578, 19.52219009399414, 22.3897705078125, 25.25735092163086, 28.12493133544922, 30.992511749267578, 33.86009216308594, 36.7276725769043, 39.595252990722656, 42.462833404541016, 45.330413818359375, 48.197994232177734, 51.065574645996094, 53.93315505981445, 56.80073547363281, 59.66831588745117, 62.53589630126953, 65.40347290039062, 68.27105712890625, 71.13864135742188, 74.00621795654297, 76.87379455566406, 79.74137878417969, 82.60896301269531, 85.4765396118164, 88.3441162109375, 91.21170043945312, 94.07928466796875, 96.94686126708984]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 1.0, 7.0, 2.0, 4.0, 8.0, 15.0, 9.0, 16.0, 22.0, 11.0, 16.0, 34.0, 28.0, 29.0, 39.0, 33.0, 34.0, 40.0, 47.0, 56.0, 47.0, 54.0, 53.0, 41.0, 48.0, 41.0, 39.0, 39.0, 31.0, 21.0, 22.0, 15.0, 15.0, 13.0, 20.0, 9.0, 8.0, 6.0, 6.0, 5.0, 6.0, 4.0, 6.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.21875, -8.94580078125, -8.6728515625, -8.39990234375, -8.126953125, -7.85400390625, -7.5810546875, -7.30810546875, -7.03515625, -6.76220703125, -6.4892578125, -6.21630859375, -5.943359375, -5.67041015625, -5.3974609375, -5.12451171875, -4.8515625, -4.57861328125, -4.3056640625, -4.03271484375, -3.759765625, -3.48681640625, -3.2138671875, -2.94091796875, -2.66796875, -2.39501953125, -2.1220703125, -1.84912109375, -1.576171875, -1.30322265625, -1.0302734375, -0.75732421875, -0.484375, -0.21142578125, 0.0615234375, 0.33447265625, 0.607421875, 0.88037109375, 1.1533203125, 1.42626953125, 1.69921875, 1.97216796875, 2.2451171875, 2.51806640625, 2.791015625, 3.06396484375, 3.3369140625, 3.60986328125, 3.8828125, 4.15576171875, 4.4287109375, 4.70166015625, 4.974609375, 5.24755859375, 5.5205078125, 5.79345703125, 6.06640625, 6.33935546875, 6.6123046875, 6.88525390625, 7.158203125, 7.43115234375, 7.7041015625, 7.97705078125, 8.25]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 6.0, 3.0, 12.0, 14.0, 13.0, 11.0, 19.0, 33.0, 47.0, 62.0, 95.0, 136.0, 200.0, 272.0, 396.0, 711.0, 1036.0, 1809.0, 3270.0, 6465.0, 15968.0, 155846.0, 2938556.0, 996271.0, 51313.0, 10378.0, 4830.0, 2582.0, 1520.0, 880.0, 536.0, 319.0, 218.0, 129.0, 95.0, 76.0, 40.0, 32.0, 30.0, 10.0, 8.0, 11.0, 10.0, 6.0, 4.0, 5.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.140625, -26.33740234375, -25.5341796875, -24.73095703125, -23.927734375, -23.12451171875, -22.3212890625, -21.51806640625, -20.71484375, -19.91162109375, -19.1083984375, -18.30517578125, -17.501953125, -16.69873046875, -15.8955078125, -15.09228515625, -14.2890625, -13.48583984375, -12.6826171875, -11.87939453125, -11.076171875, -10.27294921875, -9.4697265625, -8.66650390625, -7.86328125, -7.06005859375, -6.2568359375, -5.45361328125, -4.650390625, -3.84716796875, -3.0439453125, -2.24072265625, -1.4375, -0.63427734375, 0.1689453125, 0.97216796875, 1.775390625, 2.57861328125, 3.3818359375, 4.18505859375, 4.98828125, 5.79150390625, 6.5947265625, 7.39794921875, 8.201171875, 9.00439453125, 9.8076171875, 10.61083984375, 11.4140625, 12.21728515625, 13.0205078125, 13.82373046875, 14.626953125, 15.43017578125, 16.2333984375, 17.03662109375, 17.83984375, 18.64306640625, 19.4462890625, 20.24951171875, 21.052734375, 21.85595703125, 22.6591796875, 23.46240234375, 24.265625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 4.0, 7.0, 14.0, 7.0, 18.0, 31.0, 33.0, 43.0, 71.0, 109.0, 229.0, 532.0, 972.0, 972.0, 484.0, 200.0, 110.0, 71.0, 42.0, 26.0, 19.0, 18.0, 18.0, 9.0, 7.0, 7.0, 8.0, 7.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-28.21875, -27.27685546875, -26.3349609375, -25.39306640625, -24.451171875, -23.50927734375, -22.5673828125, -21.62548828125, -20.68359375, -19.74169921875, -18.7998046875, -17.85791015625, -16.916015625, -15.97412109375, -15.0322265625, -14.09033203125, -13.1484375, -12.20654296875, -11.2646484375, -10.32275390625, -9.380859375, -8.43896484375, -7.4970703125, -6.55517578125, -5.61328125, -4.67138671875, -3.7294921875, -2.78759765625, -1.845703125, -0.90380859375, 0.0380859375, 0.97998046875, 1.921875, 2.86376953125, 3.8056640625, 4.74755859375, 5.689453125, 6.63134765625, 7.5732421875, 8.51513671875, 9.45703125, 10.39892578125, 11.3408203125, 12.28271484375, 13.224609375, 14.16650390625, 15.1083984375, 16.05029296875, 16.9921875, 17.93408203125, 18.8759765625, 19.81787109375, 20.759765625, 21.70166015625, 22.6435546875, 23.58544921875, 24.52734375, 25.46923828125, 26.4111328125, 27.35302734375, 28.294921875, 29.23681640625, 30.1787109375, 31.12060546875, 32.0625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 6.0, 12.0, 13.0, 18.0, 31.0, 38.0, 56.0, 89.0, 158.0, 240.0, 439.0, 845.0, 1727.0, 4080.0, 10167.0, 34134.0, 247548.0, 3588725.0, 253167.0, 34632.0, 10528.0, 3981.0, 1755.0, 772.0, 449.0, 293.0, 137.0, 102.0, 49.0, 32.0, 13.0, 14.0, 7.0, 5.0, 5.0, 4.0, 8.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-41.78125, -40.5341796875, -39.287109375, -38.0400390625, -36.79296875, -35.5458984375, -34.298828125, -33.0517578125, -31.8046875, -30.5576171875, -29.310546875, -28.0634765625, -26.81640625, -25.5693359375, -24.322265625, -23.0751953125, -21.828125, -20.5810546875, -19.333984375, -18.0869140625, -16.83984375, -15.5927734375, -14.345703125, -13.0986328125, -11.8515625, -10.6044921875, -9.357421875, -8.1103515625, -6.86328125, -5.6162109375, -4.369140625, -3.1220703125, -1.875, -0.6279296875, 0.619140625, 1.8662109375, 3.11328125, 4.3603515625, 5.607421875, 6.8544921875, 8.1015625, 9.3486328125, 10.595703125, 11.8427734375, 13.08984375, 14.3369140625, 15.583984375, 16.8310546875, 18.078125, 19.3251953125, 20.572265625, 21.8193359375, 23.06640625, 24.3134765625, 25.560546875, 26.8076171875, 28.0546875, 29.3017578125, 30.548828125, 31.7958984375, 33.04296875, 34.2900390625, 35.537109375, 36.7841796875, 38.03125]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 9.0, 12.0, 9.0, 22.0, 41.0, 58.0, 88.0, 121.0, 166.0, 130.0, 108.0, 70.0, 56.0, 34.0, 19.0, 18.0, 11.0, 8.0, 3.0, 11.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-98.1707992553711, -95.26211547851562, -92.35343170166016, -89.44474792480469, -86.53606414794922, -83.62738037109375, -80.71870422363281, -77.81002044677734, -74.90133666992188, -71.9926528930664, -69.08396911621094, -66.17528533935547, -63.266605377197266, -60.3579216003418, -57.44923782348633, -54.540557861328125, -51.63187026977539, -48.72318649291992, -45.81450271606445, -42.90582275390625, -39.99713897705078, -37.08845520019531, -34.179771423339844, -31.271089553833008, -28.36240577697754, -25.45372200012207, -22.545040130615234, -19.636356353759766, -16.727672576904297, -13.818990707397461, -10.910306930541992, -8.001625061035156, -5.0929412841796875, -2.184258222579956, 0.7244248390197754, 3.633108139038086, 6.541790962219238, 9.45047378540039, 12.35915756225586, 15.267839431762695, 18.176523208618164, 21.085206985473633, 23.99388885498047, 26.902572631835938, 29.811256408691406, 32.719940185546875, 35.628623962402344, 38.53730392456055, 41.445987701416016, 44.354671478271484, 47.26335525512695, 50.172035217285156, 53.080718994140625, 55.989402770996094, 58.89808654785156, 61.80677032470703, 64.7154541015625, 67.62413787841797, 70.53282165527344, 73.4415054321289, 76.35018920898438, 79.25886535644531, 82.16755676269531, 85.07623291015625, 87.98491668701172]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 5.0, 3.0, 5.0, 3.0, 6.0, 7.0, 10.0, 5.0, 12.0, 7.0, 15.0, 14.0, 15.0, 21.0, 19.0, 30.0, 23.0, 18.0, 33.0, 31.0, 23.0, 27.0, 34.0, 42.0, 41.0, 59.0, 40.0, 34.0, 35.0, 42.0, 40.0, 34.0, 27.0, 32.0, 27.0, 28.0, 30.0, 26.0, 13.0, 15.0, 10.0, 11.0, 13.0, 7.0, 10.0, 9.0, 9.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-57.083038330078125, -55.23347091674805, -53.38390350341797, -51.53433609008789, -49.68476867675781, -47.835201263427734, -45.985633850097656, -44.13606643676758, -42.2864990234375, -40.43693161010742, -38.587364196777344, -36.737796783447266, -34.88822937011719, -33.03866195678711, -31.18909454345703, -29.339527130126953, -27.489959716796875, -25.640392303466797, -23.79082489013672, -21.94125747680664, -20.091690063476562, -18.242122650146484, -16.392555236816406, -14.542987823486328, -12.69342041015625, -10.843852996826172, -8.994285583496094, -7.144718170166016, -5.2951507568359375, -3.4455833435058594, -1.5960159301757812, 0.2535514831542969, 2.103118896484375, 3.952686309814453, 5.802253723144531, 7.651821136474609, 9.501388549804688, 11.350955963134766, 13.200523376464844, 15.050090789794922, 16.899658203125, 18.749225616455078, 20.598793029785156, 22.448360443115234, 24.297927856445312, 26.14749526977539, 27.99706268310547, 29.846630096435547, 31.696197509765625, 33.5457649230957, 35.39533233642578, 37.24489974975586, 39.09446716308594, 40.944034576416016, 42.793601989746094, 44.64316940307617, 46.49273681640625, 48.34230422973633, 50.191871643066406, 52.041439056396484, 53.89100646972656, 55.74057388305664, 57.59014129638672, 59.4397087097168, 61.289276123046875]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 4.0, 9.0, 2.0, 10.0, 11.0, 19.0, 10.0, 20.0, 19.0, 25.0, 24.0, 34.0, 41.0, 26.0, 41.0, 38.0, 45.0, 47.0, 51.0, 54.0, 61.0, 46.0, 35.0, 42.0, 35.0, 35.0, 44.0, 20.0, 24.0, 19.0, 20.0, 14.0, 12.0, 14.0, 6.0, 9.0, 4.0, 6.0, 10.0, 2.0, 5.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-9.515625, -9.24456787109375, -8.9735107421875, -8.70245361328125, -8.431396484375, -8.16033935546875, -7.8892822265625, -7.61822509765625, -7.34716796875, -7.07611083984375, -6.8050537109375, -6.53399658203125, -6.262939453125, -5.99188232421875, -5.7208251953125, -5.44976806640625, -5.1787109375, -4.90765380859375, -4.6365966796875, -4.36553955078125, -4.094482421875, -3.82342529296875, -3.5523681640625, -3.28131103515625, -3.01025390625, -2.73919677734375, -2.4681396484375, -2.19708251953125, -1.926025390625, -1.65496826171875, -1.3839111328125, -1.11285400390625, -0.841796875, -0.57073974609375, -0.2996826171875, -0.02862548828125, 0.242431640625, 0.51348876953125, 0.7845458984375, 1.05560302734375, 1.32666015625, 1.59771728515625, 1.8687744140625, 2.13983154296875, 2.410888671875, 2.68194580078125, 2.9530029296875, 3.22406005859375, 3.4951171875, 3.76617431640625, 4.0372314453125, 4.30828857421875, 4.579345703125, 4.85040283203125, 5.1214599609375, 5.39251708984375, 5.66357421875, 5.93463134765625, 6.2056884765625, 6.47674560546875, 6.747802734375, 7.01885986328125, 7.2899169921875, 7.56097412109375, 7.83203125]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 2.0, 9.0, 5.0, 6.0, 14.0, 23.0, 37.0, 53.0, 62.0, 98.0, 184.0, 288.0, 404.0, 588.0, 923.0, 1443.0, 2385.0, 3636.0, 5755.0, 9205.0, 14914.0, 24916.0, 42030.0, 72262.0, 126349.0, 231862.0, 219852.0, 119918.0, 69119.0, 39985.0, 24009.0, 14231.0, 8772.0, 5536.0, 3443.0, 2188.0, 1465.0, 862.0, 606.0, 399.0, 257.0, 146.0, 109.0, 75.0, 50.0, 24.0, 20.0, 13.0, 15.0, 7.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.2003173828125, -0.19441795349121094, -0.18851852416992188, -0.1826190948486328, -0.17671966552734375, -0.1708202362060547, -0.16492080688476562, -0.15902137756347656, -0.1531219482421875, -0.14722251892089844, -0.14132308959960938, -0.1354236602783203, -0.12952423095703125, -0.12362480163574219, -0.11772537231445312, -0.11182594299316406, -0.105926513671875, -0.10002708435058594, -0.09412765502929688, -0.08822822570800781, -0.08232879638671875, -0.07642936706542969, -0.07052993774414062, -0.06463050842285156, -0.0587310791015625, -0.05283164978027344, -0.046932220458984375, -0.04103279113769531, -0.03513336181640625, -0.029233932495117188, -0.023334503173828125, -0.017435073852539062, -0.01153564453125, -0.0056362152099609375, 0.000263214111328125, 0.0061626434326171875, 0.01206207275390625, 0.017961502075195312, 0.023860931396484375, 0.029760360717773438, 0.0356597900390625, 0.04155921936035156, 0.047458648681640625, 0.05335807800292969, 0.05925750732421875, 0.06515693664550781, 0.07105636596679688, 0.07695579528808594, 0.082855224609375, 0.08875465393066406, 0.09465408325195312, 0.10055351257324219, 0.10645294189453125, 0.11235237121582031, 0.11825180053710938, 0.12415122985839844, 0.1300506591796875, 0.13595008850097656, 0.14184951782226562, 0.1477489471435547, 0.15364837646484375, 0.1595478057861328, 0.16544723510742188, 0.17134666442871094, 0.17724609375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 6.0, 3.0, 6.0, 8.0, 10.0, 10.0, 10.0, 12.0, 11.0, 15.0, 23.0, 22.0, 20.0, 22.0, 32.0, 33.0, 35.0, 36.0, 33.0, 30.0, 45.0, 35.0, 33.0, 1061.0, 36.0, 48.0, 35.0, 38.0, 35.0, 35.0, 27.0, 31.0, 23.0, 25.0, 19.0, 26.0, 20.0, 20.0, 9.0, 5.0, 9.0, 9.0, 6.0, 4.0, 10.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.27734375, -4.13043212890625, -3.9835205078125, -3.83660888671875, -3.689697265625, -3.54278564453125, -3.3958740234375, -3.24896240234375, -3.10205078125, -2.95513916015625, -2.8082275390625, -2.66131591796875, -2.514404296875, -2.36749267578125, -2.2205810546875, -2.07366943359375, -1.9267578125, -1.77984619140625, -1.6329345703125, -1.48602294921875, -1.339111328125, -1.19219970703125, -1.0452880859375, -0.89837646484375, -0.75146484375, -0.60455322265625, -0.4576416015625, -0.31072998046875, -0.163818359375, -0.01690673828125, 0.1300048828125, 0.27691650390625, 0.423828125, 0.57073974609375, 0.7176513671875, 0.86456298828125, 1.011474609375, 1.15838623046875, 1.3052978515625, 1.45220947265625, 1.59912109375, 1.74603271484375, 1.8929443359375, 2.03985595703125, 2.186767578125, 2.33367919921875, 2.4805908203125, 2.62750244140625, 2.7744140625, 2.92132568359375, 3.0682373046875, 3.21514892578125, 3.362060546875, 3.50897216796875, 3.6558837890625, 3.80279541015625, 3.94970703125, 4.09661865234375, 4.2435302734375, 4.39044189453125, 4.537353515625, 4.68426513671875, 4.8311767578125, 4.97808837890625, 5.125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 3.0, 13.0, 18.0, 26.0, 25.0, 60.0, 78.0, 111.0, 164.0, 264.0, 365.0, 504.0, 735.0, 1056.0, 1402.0, 2032.0, 3114.0, 4511.0, 6592.0, 9780.0, 14151.0, 20706.0, 30248.0, 45080.0, 67141.0, 100897.0, 152353.0, 1234573.0, 132065.0, 87679.0, 58175.0, 38976.0, 26663.0, 18272.0, 12224.0, 8459.0, 5728.0, 4027.0, 2795.0, 1886.0, 1312.0, 866.0, 627.0, 429.0, 303.0, 210.0, 138.0, 104.0, 60.0, 50.0, 40.0, 17.0, 12.0, 5.0, 6.0, 7.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.06927490234375, -0.0670633316040039, -0.06485176086425781, -0.06264019012451172, -0.060428619384765625, -0.05821704864501953, -0.05600547790527344, -0.053793907165527344, -0.05158233642578125, -0.049370765686035156, -0.04715919494628906, -0.04494762420654297, -0.042736053466796875, -0.04052448272705078, -0.03831291198730469, -0.036101341247558594, -0.0338897705078125, -0.031678199768066406, -0.029466629028320312, -0.02725505828857422, -0.025043487548828125, -0.02283191680908203, -0.020620346069335938, -0.018408775329589844, -0.01619720458984375, -0.013985633850097656, -0.011774063110351562, -0.009562492370605469, -0.007350921630859375, -0.005139350891113281, -0.0029277801513671875, -0.0007162094116210938, 0.001495361328125, 0.0037069320678710938, 0.0059185028076171875, 0.008130073547363281, 0.010341644287109375, 0.012553215026855469, 0.014764785766601562, 0.016976356506347656, 0.01918792724609375, 0.021399497985839844, 0.023611068725585938, 0.02582263946533203, 0.028034210205078125, 0.03024578094482422, 0.03245735168457031, 0.034668922424316406, 0.0368804931640625, 0.039092063903808594, 0.04130363464355469, 0.04351520538330078, 0.045726776123046875, 0.04793834686279297, 0.05014991760253906, 0.052361488342285156, 0.05457305908203125, 0.056784629821777344, 0.05899620056152344, 0.06120777130126953, 0.06341934204101562, 0.06563091278076172, 0.06784248352050781, 0.0700540542602539, 0.072265625]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 9.0, 5.0, 9.0, 10.0, 9.0, 14.0, 24.0, 33.0, 35.0, 44.0, 40.0, 46.0, 63.0, 65.0, 56.0, 62.0, 55.0, 50.0, 51.0, 58.0, 54.0, 35.0, 31.0, 29.0, 23.0, 20.0, 17.0, 16.0, 7.0, 5.0, 6.0, 8.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00030612945556640625, -0.00029597803950309753, -0.0002858266234397888, -0.0002756752073764801, -0.0002655237913131714, -0.00025537237524986267, -0.00024522095918655396, -0.00023506954312324524, -0.00022491812705993652, -0.0002147667109966278, -0.0002046152949333191, -0.00019446387887001038, -0.00018431246280670166, -0.00017416104674339294, -0.00016400963068008423, -0.0001538582146167755, -0.0001437067985534668, -0.00013355538249015808, -0.00012340396642684937, -0.00011325255036354065, -0.00010310113430023193, -9.294971823692322e-05, -8.27983021736145e-05, -7.264688611030579e-05, -6.249547004699707e-05, -5.2344053983688354e-05, -4.219263792037964e-05, -3.204122185707092e-05, -2.1889805793762207e-05, -1.1738389730453491e-05, -1.5869736671447754e-06, 8.56444239616394e-06, 1.8715858459472656e-05, 2.8867274522781372e-05, 3.901869058609009e-05, 4.9170106649398804e-05, 5.932152271270752e-05, 6.947293877601624e-05, 7.962435483932495e-05, 8.977577090263367e-05, 9.992718696594238e-05, 0.0001100786030292511, 0.00012023001909255981, 0.00013038143515586853, 0.00014053285121917725, 0.00015068426728248596, 0.00016083568334579468, 0.0001709870994091034, 0.0001811385154724121, 0.00019128993153572083, 0.00020144134759902954, 0.00021159276366233826, 0.00022174417972564697, 0.0002318955957889557, 0.0002420470118522644, 0.0002521984279155731, 0.00026234984397888184, 0.00027250126004219055, 0.00028265267610549927, 0.000292804092168808, 0.0003029555082321167, 0.0003131069242954254, 0.00032325834035873413, 0.00033340975642204285, 0.00034356117248535156]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 5.0, 4.0, 8.0, 8.0, 13.0, 15.0, 30.0, 41.0, 53.0, 66.0, 80.0, 137.0, 179.0, 239.0, 325.0, 660.0, 6876.0, 1008033.0, 29512.0, 853.0, 404.0, 260.0, 190.0, 162.0, 105.0, 90.0, 64.0, 33.0, 32.0, 22.0, 19.0, 11.0, 10.0, 6.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00583648681640625, -0.005662977695465088, -0.005489468574523926, -0.005315959453582764, -0.0051424503326416016, -0.0049689412117004395, -0.004795432090759277, -0.004621922969818115, -0.004448413848876953, -0.004274904727935791, -0.004101395606994629, -0.003927886486053467, -0.0037543773651123047, -0.0035808682441711426, -0.0034073591232299805, -0.0032338500022888184, -0.0030603408813476562, -0.002886831760406494, -0.002713322639465332, -0.00253981351852417, -0.002366304397583008, -0.0021927952766418457, -0.0020192861557006836, -0.0018457770347595215, -0.0016722679138183594, -0.0014987587928771973, -0.0013252496719360352, -0.001151740550994873, -0.000978231430053711, -0.0008047223091125488, -0.0006312131881713867, -0.0004577040672302246, -0.0002841949462890625, -0.00011068582534790039, 6.282329559326172e-05, 0.00023633241653442383, 0.00040984153747558594, 0.000583350658416748, 0.0007568597793579102, 0.0009303689002990723, 0.0011038780212402344, 0.0012773871421813965, 0.0014508962631225586, 0.0016244053840637207, 0.0017979145050048828, 0.001971423625946045, 0.002144932746887207, 0.002318441867828369, 0.0024919509887695312, 0.0026654601097106934, 0.0028389692306518555, 0.0030124783515930176, 0.0031859874725341797, 0.003359496593475342, 0.003533005714416504, 0.003706514835357666, 0.003880023956298828, 0.00405353307723999, 0.004227042198181152, 0.0044005513191223145, 0.0045740604400634766, 0.004747569561004639, 0.004921078681945801, 0.005094587802886963, 0.005268096923828125]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 24.0, 515.0, 450.0, 22.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0032828235998749733, -0.0032251852098852396, -0.003167546819895506, -0.0031099081970751286, -0.003052269807085395, -0.002994631417095661, -0.0029369930271059275, -0.0028793546371161938, -0.00282171624712646, -0.0027640778571367264, -0.0027064394671469927, -0.002648801077157259, -0.0025911624543368816, -0.002533524064347148, -0.0024758856743574142, -0.0024182472843676805, -0.002360608661547303, -0.0023029702715575695, -0.002245331881567836, -0.002187693491578102, -0.0021300548687577248, -0.002072416478767991, -0.0020147780887782574, -0.0019571396987885237, -0.00189950130879879, -0.0018418629188090563, -0.0017842244124040008, -0.001726586022414267, -0.0016689476324245334, -0.0016113091260194778, -0.0015536707360297441, -0.0014960323460400105, -0.0014383939560502768, -0.001380755566060543, -0.0013231170596554875, -0.0012654786696657538, -0.0012078402796760201, -0.0011502017732709646, -0.001092563383281231, -0.0010349249932914972, -0.0009772864868864417, -0.0009196480386890471, -0.0008620096486993134, -0.0008043712005019188, -0.0007467327523045242, -0.0006890943041071296, -0.0006314559141173959, -0.0005738174659200013, -0.0005161790177226067, -0.0004585405986290425, -0.0004009021504316479, -0.00034326373133808374, -0.00028562528314068913, -0.00022798686404712498, -0.00017034844495356083, -0.00011270999675616622, -5.507157766260207e-05, 2.566852344898507e-06, 6.020528235239908e-05, 0.00011784370872192085, 0.00017548214236740023, 0.0002331205760128796, 0.00029075899510644376, 0.00034839744330383837, 0.0004060358623974025]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 4.0, 6.0, 6.0, 9.0, 10.0, 10.0, 24.0, 20.0, 20.0, 23.0, 30.0, 31.0, 33.0, 27.0, 49.0, 46.0, 41.0, 59.0, 48.0, 40.0, 48.0, 42.0, 41.0, 44.0, 32.0, 38.0, 27.0, 32.0, 26.0, 31.0, 21.0, 16.0, 14.0, 12.0, 15.0, 10.0, 5.0, 6.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0002675056457519531, -0.0002597291022539139, -0.00025195255875587463, -0.0002441760152578354, -0.00023639947175979614, -0.0002286229282617569, -0.00022084638476371765, -0.0002130698412656784, -0.00020529329776763916, -0.00019751675426959991, -0.00018974021077156067, -0.00018196366727352142, -0.00017418712377548218, -0.00016641058027744293, -0.0001586340367794037, -0.00015085749328136444, -0.0001430809497833252, -0.00013530440628528595, -0.0001275278627872467, -0.00011975131928920746, -0.00011197477579116821, -0.00010419823229312897, -9.642168879508972e-05, -8.864514529705048e-05, -8.086860179901123e-05, -7.309205830097198e-05, -6.531551480293274e-05, -5.7538971304893494e-05, -4.976242780685425e-05, -4.1985884308815e-05, -3.420934081077576e-05, -2.643279731273651e-05, -1.8656253814697266e-05, -1.087971031665802e-05, -3.1031668186187744e-06, 4.673376679420471e-06, 1.2449920177459717e-05, 2.0226463675498962e-05, 2.8003007173538208e-05, 3.5779550671577454e-05, 4.35560941696167e-05, 5.1332637667655945e-05, 5.910918116569519e-05, 6.688572466373444e-05, 7.466226816177368e-05, 8.243881165981293e-05, 9.021535515785217e-05, 9.799189865589142e-05, 0.00010576844215393066, 0.00011354498565196991, 0.00012132152915000916, 0.0001290980726480484, 0.00013687461614608765, 0.0001446511596441269, 0.00015242770314216614, 0.00016020424664020538, 0.00016798079013824463, 0.00017575733363628387, 0.00018353387713432312, 0.00019131042063236237, 0.0001990869641304016, 0.00020686350762844086, 0.0002146400511264801, 0.00022241659462451935, 0.0002301931381225586]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 4.0, 9.0, 2.0, 10.0, 11.0, 19.0, 10.0, 20.0, 19.0, 25.0, 24.0, 34.0, 41.0, 26.0, 41.0, 38.0, 45.0, 47.0, 51.0, 54.0, 61.0, 46.0, 35.0, 42.0, 35.0, 35.0, 44.0, 20.0, 24.0, 19.0, 20.0, 14.0, 12.0, 14.0, 6.0, 9.0, 4.0, 6.0, 10.0, 2.0, 5.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-9.515625, -9.24456787109375, -8.9735107421875, -8.70245361328125, -8.431396484375, -8.16033935546875, -7.8892822265625, -7.61822509765625, -7.34716796875, -7.07611083984375, -6.8050537109375, -6.53399658203125, -6.262939453125, -5.99188232421875, -5.7208251953125, -5.44976806640625, -5.1787109375, -4.90765380859375, -4.6365966796875, -4.36553955078125, -4.094482421875, -3.82342529296875, -3.5523681640625, -3.28131103515625, -3.01025390625, -2.73919677734375, -2.4681396484375, -2.19708251953125, -1.926025390625, -1.65496826171875, -1.3839111328125, -1.11285400390625, -0.841796875, -0.57073974609375, -0.2996826171875, -0.02862548828125, 0.242431640625, 0.51348876953125, 0.7845458984375, 1.05560302734375, 1.32666015625, 1.59771728515625, 1.8687744140625, 2.13983154296875, 2.410888671875, 2.68194580078125, 2.9530029296875, 3.22406005859375, 3.4951171875, 3.76617431640625, 4.0372314453125, 4.30828857421875, 4.579345703125, 4.85040283203125, 5.1214599609375, 5.39251708984375, 5.66357421875, 5.93463134765625, 6.2056884765625, 6.47674560546875, 6.747802734375, 7.01885986328125, 7.2899169921875, 7.56097412109375, 7.83203125]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 1.0, 5.0, 11.0, 12.0, 6.0, 23.0, 18.0, 25.0, 27.0, 39.0, 51.0, 67.0, 114.0, 170.0, 277.0, 453.0, 729.0, 1187.0, 2020.0, 3901.0, 8089.0, 22896.0, 163588.0, 771201.0, 48504.0, 12944.0, 5415.0, 2725.0, 1526.0, 908.0, 564.0, 344.0, 219.0, 153.0, 101.0, 71.0, 45.0, 38.0, 23.0, 10.0, 12.0, 8.0, 8.0, 5.0, 4.0, 4.0, 4.0, 2.0, 4.0, 4.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-25.96875, -25.080810546875, -24.19287109375, -23.304931640625, -22.4169921875, -21.529052734375, -20.64111328125, -19.753173828125, -18.865234375, -17.977294921875, -17.08935546875, -16.201416015625, -15.3134765625, -14.425537109375, -13.53759765625, -12.649658203125, -11.76171875, -10.873779296875, -9.98583984375, -9.097900390625, -8.2099609375, -7.322021484375, -6.43408203125, -5.546142578125, -4.658203125, -3.770263671875, -2.88232421875, -1.994384765625, -1.1064453125, -0.218505859375, 0.66943359375, 1.557373046875, 2.4453125, 3.333251953125, 4.22119140625, 5.109130859375, 5.9970703125, 6.885009765625, 7.77294921875, 8.660888671875, 9.548828125, 10.436767578125, 11.32470703125, 12.212646484375, 13.1005859375, 13.988525390625, 14.87646484375, 15.764404296875, 16.65234375, 17.540283203125, 18.42822265625, 19.316162109375, 20.2041015625, 21.092041015625, 21.97998046875, 22.867919921875, 23.755859375, 24.643798828125, 25.53173828125, 26.419677734375, 27.3076171875, 28.195556640625, 29.08349609375, 29.971435546875, 30.859375]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 8.0, 7.0, 11.0, 13.0, 15.0, 19.0, 21.0, 28.0, 33.0, 38.0, 44.0, 38.0, 34.0, 54.0, 86.0, 147.0, 1565.0, 315.0, 114.0, 68.0, 53.0, 32.0, 45.0, 28.0, 35.0, 36.0, 27.0, 18.0, 23.0, 22.0, 12.0, 6.0, 16.0, 7.0, 6.0, 6.0, 3.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-28.5625, -27.63525390625, -26.7080078125, -25.78076171875, -24.853515625, -23.92626953125, -22.9990234375, -22.07177734375, -21.14453125, -20.21728515625, -19.2900390625, -18.36279296875, -17.435546875, -16.50830078125, -15.5810546875, -14.65380859375, -13.7265625, -12.79931640625, -11.8720703125, -10.94482421875, -10.017578125, -9.09033203125, -8.1630859375, -7.23583984375, -6.30859375, -5.38134765625, -4.4541015625, -3.52685546875, -2.599609375, -1.67236328125, -0.7451171875, 0.18212890625, 1.109375, 2.03662109375, 2.9638671875, 3.89111328125, 4.818359375, 5.74560546875, 6.6728515625, 7.60009765625, 8.52734375, 9.45458984375, 10.3818359375, 11.30908203125, 12.236328125, 13.16357421875, 14.0908203125, 15.01806640625, 15.9453125, 16.87255859375, 17.7998046875, 18.72705078125, 19.654296875, 20.58154296875, 21.5087890625, 22.43603515625, 23.36328125, 24.29052734375, 25.2177734375, 26.14501953125, 27.072265625, 27.99951171875, 28.9267578125, 29.85400390625, 30.78125]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 6.0, 7.0, 4.0, 11.0, 5.0, 11.0, 18.0, 30.0, 32.0, 38.0, 58.0, 85.0, 129.0, 235.0, 521.0, 1173.0, 3109.0, 10721.0, 75919.0, 2939636.0, 96013.0, 12091.0, 3410.0, 1270.0, 506.0, 249.0, 133.0, 77.0, 61.0, 45.0, 27.0, 19.0, 13.0, 17.0, 11.0, 5.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-49.53125, -48.09716796875, -46.6630859375, -45.22900390625, -43.794921875, -42.36083984375, -40.9267578125, -39.49267578125, -38.05859375, -36.62451171875, -35.1904296875, -33.75634765625, -32.322265625, -30.88818359375, -29.4541015625, -28.02001953125, -26.5859375, -25.15185546875, -23.7177734375, -22.28369140625, -20.849609375, -19.41552734375, -17.9814453125, -16.54736328125, -15.11328125, -13.67919921875, -12.2451171875, -10.81103515625, -9.376953125, -7.94287109375, -6.5087890625, -5.07470703125, -3.640625, -2.20654296875, -0.7724609375, 0.66162109375, 2.095703125, 3.52978515625, 4.9638671875, 6.39794921875, 7.83203125, 9.26611328125, 10.7001953125, 12.13427734375, 13.568359375, 15.00244140625, 16.4365234375, 17.87060546875, 19.3046875, 20.73876953125, 22.1728515625, 23.60693359375, 25.041015625, 26.47509765625, 27.9091796875, 29.34326171875, 30.77734375, 32.21142578125, 33.6455078125, 35.07958984375, 36.513671875, 37.94775390625, 39.3818359375, 40.81591796875, 42.25]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [3.0, 25.0, 153.0, 563.0, 222.0, 39.0, 10.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.226104736328125, -21.176929473876953, -13.127754211425781, -5.078578948974609, 2.9705963134765625, 11.019771575927734, 19.068946838378906, 27.118122100830078, 35.16729736328125, 43.21647262573242, 51.265647888183594, 59.314823150634766, 67.36399841308594, 75.41317749023438, 83.46234893798828, 91.51152038574219, 99.56069946289062, 107.60987854003906, 115.65904998779297, 123.70822143554688, 131.7574005126953, 139.80657958984375, 147.85574340820312, 155.90492248535156, 163.9541015625, 172.00328063964844, 180.05245971679688, 188.10162353515625, 196.1508026123047, 204.19998168945312, 212.2491455078125, 220.29832458496094, 228.3475341796875, 236.39671325683594, 244.44589233398438, 252.49505615234375, 260.54425048828125, 268.5934143066406, 276.642578125, 284.6917724609375, 292.7409362792969, 300.79010009765625, 308.83929443359375, 316.8884582519531, 324.9376220703125, 332.98681640625, 341.0359802246094, 349.0851745605469, 357.13433837890625, 365.1835021972656, 373.2326965332031, 381.2818603515625, 389.3310546875, 397.3802185058594, 405.42938232421875, 413.47857666015625, 421.5277404785156, 429.576904296875, 437.6260986328125, 445.6752624511719, 453.72442626953125, 461.77362060546875, 469.8227844238281, 477.8719787597656, 485.921142578125]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 4.0, 4.0, 4.0, 4.0, 9.0, 16.0, 7.0, 17.0, 14.0, 20.0, 29.0, 26.0, 28.0, 27.0, 22.0, 40.0, 33.0, 33.0, 43.0, 35.0, 41.0, 43.0, 44.0, 50.0, 40.0, 40.0, 37.0, 36.0, 37.0, 34.0, 36.0, 33.0, 12.0, 17.0, 13.0, 14.0, 11.0, 16.0, 4.0, 11.0, 5.0, 3.0, 6.0, 2.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-90.70098876953125, -87.95838928222656, -85.21578979492188, -82.47319030761719, -79.7305908203125, -76.98799133300781, -74.24539184570312, -71.5027847290039, -68.76018524169922, -66.01758575439453, -63.274986267089844, -60.532386779785156, -57.7897834777832, -55.047183990478516, -52.30458450317383, -49.561981201171875, -46.81938552856445, -44.076786041259766, -41.33418655395508, -38.591583251953125, -35.84898376464844, -33.10638427734375, -30.363784790039062, -27.621183395385742, -24.878583908081055, -22.135984420776367, -19.393383026123047, -16.65078353881836, -13.908183097839355, -11.165582656860352, -8.422983169555664, -5.680381774902344, -2.9377822875976562, -0.19518208503723145, 2.5474181175231934, 5.290018081665039, 8.032618522644043, 10.775218963623047, 13.517818450927734, 16.260419845581055, 19.003019332885742, 21.74561882019043, 24.48822021484375, 27.230819702148438, 29.973419189453125, 32.71601867675781, 35.4586181640625, 38.20122146606445, 40.94382095336914, 43.68642044067383, 46.429019927978516, 49.17162322998047, 51.914222717285156, 54.656822204589844, 57.39942169189453, 60.14202117919922, 62.884620666503906, 65.6272201538086, 68.36981964111328, 71.11241912841797, 73.85501861572266, 76.59762573242188, 79.34022521972656, 82.08282470703125, 84.82542419433594]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 3.0, 4.0, 4.0, 6.0, 13.0, 11.0, 13.0, 14.0, 33.0, 19.0, 19.0, 30.0, 31.0, 36.0, 46.0, 32.0, 47.0, 39.0, 43.0, 56.0, 55.0, 42.0, 48.0, 45.0, 36.0, 39.0, 35.0, 29.0, 29.0, 23.0, 18.0, 15.0, 20.0, 8.0, 12.0, 8.0, 6.0, 3.0, 12.0, 4.0, 3.0, 5.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-9.9921875, -9.7122802734375, -9.432373046875, -9.1524658203125, -8.87255859375, -8.5926513671875, -8.312744140625, -8.0328369140625, -7.7529296875, -7.4730224609375, -7.193115234375, -6.9132080078125, -6.63330078125, -6.3533935546875, -6.073486328125, -5.7935791015625, -5.513671875, -5.2337646484375, -4.953857421875, -4.6739501953125, -4.39404296875, -4.1141357421875, -3.834228515625, -3.5543212890625, -3.2744140625, -2.9945068359375, -2.714599609375, -2.4346923828125, -2.15478515625, -1.8748779296875, -1.594970703125, -1.3150634765625, -1.03515625, -0.7552490234375, -0.475341796875, -0.1954345703125, 0.08447265625, 0.3643798828125, 0.644287109375, 0.9241943359375, 1.2041015625, 1.4840087890625, 1.763916015625, 2.0438232421875, 2.32373046875, 2.6036376953125, 2.883544921875, 3.1634521484375, 3.443359375, 3.7232666015625, 4.003173828125, 4.2830810546875, 4.56298828125, 4.8428955078125, 5.122802734375, 5.4027099609375, 5.6826171875, 5.9625244140625, 6.242431640625, 6.5223388671875, 6.80224609375, 7.0821533203125, 7.362060546875, 7.6419677734375, 7.921875]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 4.0, 7.0, 6.0, 8.0, 15.0, 17.0, 27.0, 30.0, 62.0, 69.0, 80.0, 126.0, 168.0, 243.0, 354.0, 519.0, 825.0, 1268.0, 2129.0, 3388.0, 6329.0, 13207.0, 46986.0, 471690.0, 2929203.0, 622923.0, 62956.0, 14921.0, 7000.0, 3668.0, 2220.0, 1325.0, 771.0, 582.0, 384.0, 243.0, 172.0, 108.0, 75.0, 65.0, 32.0, 25.0, 15.0, 15.0, 9.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 3.0], "bins": [-23.328125, -22.68994140625, -22.0517578125, -21.41357421875, -20.775390625, -20.13720703125, -19.4990234375, -18.86083984375, -18.22265625, -17.58447265625, -16.9462890625, -16.30810546875, -15.669921875, -15.03173828125, -14.3935546875, -13.75537109375, -13.1171875, -12.47900390625, -11.8408203125, -11.20263671875, -10.564453125, -9.92626953125, -9.2880859375, -8.64990234375, -8.01171875, -7.37353515625, -6.7353515625, -6.09716796875, -5.458984375, -4.82080078125, -4.1826171875, -3.54443359375, -2.90625, -2.26806640625, -1.6298828125, -0.99169921875, -0.353515625, 0.28466796875, 0.9228515625, 1.56103515625, 2.19921875, 2.83740234375, 3.4755859375, 4.11376953125, 4.751953125, 5.39013671875, 6.0283203125, 6.66650390625, 7.3046875, 7.94287109375, 8.5810546875, 9.21923828125, 9.857421875, 10.49560546875, 11.1337890625, 11.77197265625, 12.41015625, 13.04833984375, 13.6865234375, 14.32470703125, 14.962890625, 15.60107421875, 16.2392578125, 16.87744140625, 17.515625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 1.0, 5.0, 4.0, 5.0, 4.0, 8.0, 6.0, 12.0, 21.0, 19.0, 26.0, 38.0, 44.0, 61.0, 97.0, 172.0, 361.0, 688.0, 888.0, 653.0, 394.0, 191.0, 113.0, 57.0, 39.0, 39.0, 21.0, 28.0, 13.0, 11.0, 12.0, 8.0, 10.0, 5.0, 2.0, 8.0, 2.0, 5.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-26.046875, -25.270263671875, -24.49365234375, -23.717041015625, -22.9404296875, -22.163818359375, -21.38720703125, -20.610595703125, -19.833984375, -19.057373046875, -18.28076171875, -17.504150390625, -16.7275390625, -15.950927734375, -15.17431640625, -14.397705078125, -13.62109375, -12.844482421875, -12.06787109375, -11.291259765625, -10.5146484375, -9.738037109375, -8.96142578125, -8.184814453125, -7.408203125, -6.631591796875, -5.85498046875, -5.078369140625, -4.3017578125, -3.525146484375, -2.74853515625, -1.971923828125, -1.1953125, -0.418701171875, 0.35791015625, 1.134521484375, 1.9111328125, 2.687744140625, 3.46435546875, 4.240966796875, 5.017578125, 5.794189453125, 6.57080078125, 7.347412109375, 8.1240234375, 8.900634765625, 9.67724609375, 10.453857421875, 11.23046875, 12.007080078125, 12.78369140625, 13.560302734375, 14.3369140625, 15.113525390625, 15.89013671875, 16.666748046875, 17.443359375, 18.219970703125, 18.99658203125, 19.773193359375, 20.5498046875, 21.326416015625, 22.10302734375, 22.879638671875, 23.65625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 4.0, 5.0, 9.0, 8.0, 27.0, 23.0, 35.0, 56.0, 67.0, 121.0, 164.0, 235.0, 450.0, 669.0, 1146.0, 1891.0, 3316.0, 6232.0, 12220.0, 27491.0, 79096.0, 563008.0, 3055936.0, 333827.0, 61755.0, 23047.0, 10693.0, 5328.0, 2979.0, 1704.0, 968.0, 596.0, 421.0, 259.0, 182.0, 96.0, 68.0, 48.0, 26.0, 22.0, 18.0, 13.0, 13.0, 5.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.484375, -23.678955078125, -22.87353515625, -22.068115234375, -21.2626953125, -20.457275390625, -19.65185546875, -18.846435546875, -18.041015625, -17.235595703125, -16.43017578125, -15.624755859375, -14.8193359375, -14.013916015625, -13.20849609375, -12.403076171875, -11.59765625, -10.792236328125, -9.98681640625, -9.181396484375, -8.3759765625, -7.570556640625, -6.76513671875, -5.959716796875, -5.154296875, -4.348876953125, -3.54345703125, -2.738037109375, -1.9326171875, -1.127197265625, -0.32177734375, 0.483642578125, 1.2890625, 2.094482421875, 2.89990234375, 3.705322265625, 4.5107421875, 5.316162109375, 6.12158203125, 6.927001953125, 7.732421875, 8.537841796875, 9.34326171875, 10.148681640625, 10.9541015625, 11.759521484375, 12.56494140625, 13.370361328125, 14.17578125, 14.981201171875, 15.78662109375, 16.592041015625, 17.3974609375, 18.202880859375, 19.00830078125, 19.813720703125, 20.619140625, 21.424560546875, 22.22998046875, 23.035400390625, 23.8408203125, 24.646240234375, 25.45166015625, 26.257080078125, 27.0625]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 7.0, 35.0, 91.0, 262.0, 384.0, 162.0, 47.0, 16.0, 3.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.69752502441406, -81.86127471923828, -73.02503204345703, -64.18878173828125, -55.352535247802734, -46.51628875732422, -37.68003845214844, -28.843791961669922, -20.007545471191406, -11.171298027038574, -2.335050582885742, 6.501197814941406, 15.337444305419922, 24.173690795898438, 33.00994110107422, 41.846187591552734, 50.68243408203125, 59.518680572509766, 68.35492706298828, 77.19117736816406, 86.02742004394531, 94.8636703491211, 103.69992065429688, 112.53616333007812, 121.3724136352539, 130.2086639404297, 139.04490661621094, 147.88116455078125, 156.7174072265625, 165.55364990234375, 174.389892578125, 183.2261505126953, 192.06240844726562, 200.89865112304688, 209.7349090576172, 218.57115173339844, 227.4073944091797, 236.24365234375, 245.07989501953125, 253.9161376953125, 262.75238037109375, 271.588623046875, 280.42486572265625, 289.2611083984375, 298.0973815917969, 306.9336242675781, 315.7698669433594, 324.6061096191406, 333.4423828125, 342.27862548828125, 351.1148681640625, 359.95111083984375, 368.7873840332031, 377.6236267089844, 386.4598693847656, 395.2961120605469, 404.1323547363281, 412.9685974121094, 421.8048400878906, 430.64111328125, 439.47735595703125, 448.3135986328125, 457.14984130859375, 465.986083984375, 474.82232666015625]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 6.0, 5.0, 7.0, 5.0, 7.0, 8.0, 14.0, 11.0, 21.0, 20.0, 16.0, 22.0, 28.0, 28.0, 30.0, 33.0, 44.0, 39.0, 36.0, 40.0, 44.0, 35.0, 41.0, 33.0, 46.0, 37.0, 33.0, 41.0, 28.0, 34.0, 25.0, 34.0, 23.0, 23.0, 25.0, 18.0, 7.0, 11.0, 5.0, 13.0, 7.0, 9.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-68.72080993652344, -66.65535736083984, -64.58990478515625, -62.52445983886719, -60.459007263183594, -58.3935546875, -56.32810592651367, -54.262657165527344, -52.19720458984375, -50.131752014160156, -48.06630325317383, -46.0008544921875, -43.935401916503906, -41.86994934082031, -39.804500579833984, -37.739051818847656, -35.67359924316406, -33.60814666748047, -31.54269790649414, -29.47724723815918, -27.41179656982422, -25.346345901489258, -23.280895233154297, -21.215444564819336, -19.149993896484375, -17.084543228149414, -15.019092559814453, -12.953641891479492, -10.888191223144531, -8.82274055480957, -6.757289886474609, -4.691839218139648, -2.6263885498046875, -0.5609378814697266, 1.5045127868652344, 3.5699634552001953, 5.635414123535156, 7.700864791870117, 9.766315460205078, 11.831766128540039, 13.897216796875, 15.962667465209961, 18.028118133544922, 20.093568801879883, 22.159019470214844, 24.224470138549805, 26.289920806884766, 28.355371475219727, 30.420822143554688, 32.48627471923828, 34.55172348022461, 36.61717224121094, 38.68262481689453, 40.748077392578125, 42.81352615356445, 44.87897491455078, 46.944427490234375, 49.00988006591797, 51.0753288269043, 53.140777587890625, 55.20623016357422, 57.27168273925781, 59.33713150024414, 61.40258026123047, 63.46803283691406]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 8.0, 5.0, 6.0, 10.0, 17.0, 11.0, 9.0, 16.0, 21.0, 20.0, 30.0, 29.0, 35.0, 39.0, 33.0, 41.0, 39.0, 55.0, 34.0, 38.0, 43.0, 49.0, 48.0, 46.0, 32.0, 36.0, 34.0, 25.0, 32.0, 28.0, 24.0, 19.0, 10.0, 16.0, 7.0, 11.0, 12.0, 6.0, 9.0, 3.0, 5.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0], "bins": [-9.5546875, -9.28680419921875, -9.0189208984375, -8.75103759765625, -8.483154296875, -8.21527099609375, -7.9473876953125, -7.67950439453125, -7.41162109375, -7.14373779296875, -6.8758544921875, -6.60797119140625, -6.340087890625, -6.07220458984375, -5.8043212890625, -5.53643798828125, -5.2685546875, -5.00067138671875, -4.7327880859375, -4.46490478515625, -4.197021484375, -3.92913818359375, -3.6612548828125, -3.39337158203125, -3.12548828125, -2.85760498046875, -2.5897216796875, -2.32183837890625, -2.053955078125, -1.78607177734375, -1.5181884765625, -1.25030517578125, -0.982421875, -0.71453857421875, -0.4466552734375, -0.17877197265625, 0.089111328125, 0.35699462890625, 0.6248779296875, 0.89276123046875, 1.16064453125, 1.42852783203125, 1.6964111328125, 1.96429443359375, 2.232177734375, 2.50006103515625, 2.7679443359375, 3.03582763671875, 3.3037109375, 3.57159423828125, 3.8394775390625, 4.10736083984375, 4.375244140625, 4.64312744140625, 4.9110107421875, 5.17889404296875, 5.44677734375, 5.71466064453125, 5.9825439453125, 6.25042724609375, 6.518310546875, 6.78619384765625, 7.0540771484375, 7.32196044921875, 7.58984375]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 4.0, 1.0, 6.0, 7.0, 6.0, 11.0, 21.0, 25.0, 47.0, 53.0, 105.0, 137.0, 198.0, 228.0, 347.0, 453.0, 694.0, 941.0, 1414.0, 2069.0, 3031.0, 4375.0, 6617.0, 9942.0, 15281.0, 23662.0, 37226.0, 59597.0, 96489.0, 158861.0, 222728.0, 151581.0, 92177.0, 56968.0, 35597.0, 22982.0, 14834.0, 9638.0, 6352.0, 4185.0, 2967.0, 2014.0, 1423.0, 1015.0, 695.0, 458.0, 341.0, 241.0, 164.0, 117.0, 65.0, 59.0, 33.0, 27.0, 17.0, 14.0, 9.0, 8.0, 7.0, 2.0, 2.0], "bins": [-0.1878662109375, -0.1822509765625, -0.1766357421875, -0.1710205078125, -0.1654052734375, -0.1597900390625, -0.1541748046875, -0.1485595703125, -0.1429443359375, -0.1373291015625, -0.1317138671875, -0.1260986328125, -0.1204833984375, -0.1148681640625, -0.1092529296875, -0.1036376953125, -0.0980224609375, -0.0924072265625, -0.0867919921875, -0.0811767578125, -0.0755615234375, -0.0699462890625, -0.0643310546875, -0.0587158203125, -0.0531005859375, -0.0474853515625, -0.0418701171875, -0.0362548828125, -0.0306396484375, -0.0250244140625, -0.0194091796875, -0.0137939453125, -0.0081787109375, -0.0025634765625, 0.0030517578125, 0.0086669921875, 0.0142822265625, 0.0198974609375, 0.0255126953125, 0.0311279296875, 0.0367431640625, 0.0423583984375, 0.0479736328125, 0.0535888671875, 0.0592041015625, 0.0648193359375, 0.0704345703125, 0.0760498046875, 0.0816650390625, 0.0872802734375, 0.0928955078125, 0.0985107421875, 0.1041259765625, 0.1097412109375, 0.1153564453125, 0.1209716796875, 0.1265869140625, 0.1322021484375, 0.1378173828125, 0.1434326171875, 0.1490478515625, 0.1546630859375, 0.1602783203125, 0.1658935546875, 0.1715087890625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 3.0, 8.0, 9.0, 10.0, 11.0, 10.0, 16.0, 12.0, 14.0, 24.0, 17.0, 28.0, 28.0, 36.0, 27.0, 30.0, 31.0, 31.0, 31.0, 35.0, 35.0, 1070.0, 39.0, 27.0, 44.0, 28.0, 46.0, 42.0, 26.0, 31.0, 26.0, 29.0, 19.0, 16.0, 25.0, 14.0, 10.0, 17.0, 11.0, 14.0, 4.0, 14.0, 8.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0], "bins": [-5.1953125, -5.03619384765625, -4.8770751953125, -4.71795654296875, -4.558837890625, -4.39971923828125, -4.2406005859375, -4.08148193359375, -3.92236328125, -3.76324462890625, -3.6041259765625, -3.44500732421875, -3.285888671875, -3.12677001953125, -2.9676513671875, -2.80853271484375, -2.6494140625, -2.49029541015625, -2.3311767578125, -2.17205810546875, -2.012939453125, -1.85382080078125, -1.6947021484375, -1.53558349609375, -1.37646484375, -1.21734619140625, -1.0582275390625, -0.89910888671875, -0.739990234375, -0.58087158203125, -0.4217529296875, -0.26263427734375, -0.103515625, 0.05560302734375, 0.2147216796875, 0.37384033203125, 0.532958984375, 0.69207763671875, 0.8511962890625, 1.01031494140625, 1.16943359375, 1.32855224609375, 1.4876708984375, 1.64678955078125, 1.805908203125, 1.96502685546875, 2.1241455078125, 2.28326416015625, 2.4423828125, 2.60150146484375, 2.7606201171875, 2.91973876953125, 3.078857421875, 3.23797607421875, 3.3970947265625, 3.55621337890625, 3.71533203125, 3.87445068359375, 4.0335693359375, 4.19268798828125, 4.351806640625, 4.51092529296875, 4.6700439453125, 4.82916259765625, 4.98828125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 7.0, 9.0, 13.0, 9.0, 25.0, 38.0, 44.0, 83.0, 102.0, 144.0, 184.0, 316.0, 453.0, 682.0, 929.0, 1320.0, 1859.0, 2735.0, 4058.0, 5818.0, 8463.0, 12004.0, 17327.0, 24558.0, 35361.0, 50418.0, 72972.0, 107421.0, 165542.0, 1205452.0, 117356.0, 79724.0, 55293.0, 38362.0, 26893.0, 18773.0, 12894.0, 8941.0, 6372.0, 4322.0, 3013.0, 2126.0, 1457.0, 977.0, 686.0, 489.0, 362.0, 253.0, 153.0, 114.0, 80.0, 55.0, 37.0, 23.0, 11.0, 13.0, 7.0, 6.0, 6.0, 2.0, 1.0], "bins": [-0.07403564453125, -0.0717306137084961, -0.06942558288574219, -0.06712055206298828, -0.06481552124023438, -0.06251049041748047, -0.06020545959472656, -0.057900428771972656, -0.05559539794921875, -0.053290367126464844, -0.05098533630371094, -0.04868030548095703, -0.046375274658203125, -0.04407024383544922, -0.04176521301269531, -0.039460182189941406, -0.0371551513671875, -0.034850120544433594, -0.03254508972167969, -0.03024005889892578, -0.027935028076171875, -0.02562999725341797, -0.023324966430664062, -0.021019935607910156, -0.01871490478515625, -0.016409873962402344, -0.014104843139648438, -0.011799812316894531, -0.009494781494140625, -0.007189750671386719, -0.0048847198486328125, -0.0025796890258789062, -0.000274658203125, 0.0020303726196289062, 0.0043354034423828125, 0.006640434265136719, 0.008945465087890625, 0.011250495910644531, 0.013555526733398438, 0.015860557556152344, 0.01816558837890625, 0.020470619201660156, 0.022775650024414062, 0.02508068084716797, 0.027385711669921875, 0.02969074249267578, 0.03199577331542969, 0.034300804138183594, 0.0366058349609375, 0.038910865783691406, 0.04121589660644531, 0.04352092742919922, 0.045825958251953125, 0.04813098907470703, 0.05043601989746094, 0.052741050720214844, 0.05504608154296875, 0.057351112365722656, 0.05965614318847656, 0.06196117401123047, 0.06426620483398438, 0.06657123565673828, 0.06887626647949219, 0.0711812973022461, 0.073486328125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 2.0, 3.0, 15.0, 14.0, 15.0, 16.0, 21.0, 23.0, 21.0, 36.0, 47.0, 50.0, 57.0, 60.0, 68.0, 62.0, 59.0, 59.0, 58.0, 52.0, 47.0, 43.0, 36.0, 20.0, 20.0, 19.0, 14.0, 15.0, 10.0, 6.0, 8.0, 4.0, 10.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0008215904235839844, -0.0007985308766365051, -0.0007754713296890259, -0.0007524117827415466, -0.0007293522357940674, -0.0007062926888465881, -0.0006832331418991089, -0.0006601735949516296, -0.0006371140480041504, -0.0006140545010566711, -0.0005909949541091919, -0.0005679354071617126, -0.0005448758602142334, -0.0005218163132667542, -0.0004987567663192749, -0.00047569721937179565, -0.0004526376724243164, -0.00042957812547683716, -0.0004065185785293579, -0.00038345903158187866, -0.0003603994846343994, -0.00033733993768692017, -0.0003142803907394409, -0.00029122084379196167, -0.0002681612968444824, -0.0002451017498970032, -0.00022204220294952393, -0.00019898265600204468, -0.00017592310905456543, -0.00015286356210708618, -0.00012980401515960693, -0.00010674446821212769, -8.368492126464844e-05, -6.062537431716919e-05, -3.756582736968994e-05, -1.4506280422210693e-05, 8.553266525268555e-06, 3.16128134727478e-05, 5.467236042022705e-05, 7.77319073677063e-05, 0.00010079145431518555, 0.0001238510012626648, 0.00014691054821014404, 0.0001699700951576233, 0.00019302964210510254, 0.0002160891890525818, 0.00023914873600006104, 0.0002622082829475403, 0.00028526782989501953, 0.0003083273768424988, 0.00033138692378997803, 0.0003544464707374573, 0.0003775060176849365, 0.00040056556463241577, 0.000423625111579895, 0.00044668465852737427, 0.0004697442054748535, 0.0004928037524223328, 0.000515863299369812, 0.0005389228463172913, 0.0005619823932647705, 0.0005850419402122498, 0.000608101487159729, 0.0006311610341072083, 0.0006542205810546875]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 0.0, 5.0, 9.0, 6.0, 15.0, 15.0, 15.0, 21.0, 41.0, 31.0, 60.0, 86.0, 140.0, 161.0, 229.0, 417.0, 1007.0, 26295.0, 1011221.0, 6912.0, 742.0, 356.0, 224.0, 150.0, 106.0, 76.0, 62.0, 42.0, 31.0, 25.0, 17.0, 18.0, 4.0, 4.0, 6.0, 5.0, 1.0, 0.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01171112060546875, -0.011298298835754395, -0.010885477066040039, -0.010472655296325684, -0.010059833526611328, -0.009647011756896973, -0.009234189987182617, -0.008821368217468262, -0.008408546447753906, -0.00799572467803955, -0.007582902908325195, -0.00717008113861084, -0.006757259368896484, -0.006344437599182129, -0.0059316158294677734, -0.005518794059753418, -0.0051059722900390625, -0.004693150520324707, -0.0042803287506103516, -0.003867506980895996, -0.0034546852111816406, -0.003041863441467285, -0.0026290416717529297, -0.0022162199020385742, -0.0018033981323242188, -0.0013905763626098633, -0.0009777545928955078, -0.0005649328231811523, -0.00015211105346679688, 0.0002607107162475586, 0.0006735324859619141, 0.0010863542556762695, 0.001499176025390625, 0.0019119977951049805, 0.002324819564819336, 0.0027376413345336914, 0.003150463104248047, 0.0035632848739624023, 0.003976106643676758, 0.004388928413391113, 0.004801750183105469, 0.005214571952819824, 0.00562739372253418, 0.006040215492248535, 0.006453037261962891, 0.006865859031677246, 0.0072786808013916016, 0.007691502571105957, 0.008104324340820312, 0.008517146110534668, 0.008929967880249023, 0.009342789649963379, 0.009755611419677734, 0.01016843318939209, 0.010581254959106445, 0.0109940767288208, 0.011406898498535156, 0.011819720268249512, 0.012232542037963867, 0.012645363807678223, 0.013058185577392578, 0.013471007347106934, 0.013883829116821289, 0.014296650886535645, 0.01470947265625]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 925.0, 84.0, 0.0, 1.0], "bins": [-0.025905147194862366, -0.025479130446910858, -0.02505311369895935, -0.024627096951007843, -0.024201078340411186, -0.02377506159245968, -0.02334904484450817, -0.022923028096556664, -0.022497011348605156, -0.02207099460065365, -0.02164497785270214, -0.021218961104750633, -0.020792942494153976, -0.02036692574620247, -0.01994090899825096, -0.019514892250299454, -0.019088875502347946, -0.01866285875439644, -0.01823684200644493, -0.017810825258493423, -0.017384806647896767, -0.01695878989994526, -0.01653277315199375, -0.016106756404042244, -0.015680739656090736, -0.015254722908139229, -0.014828705228865147, -0.014402688480913639, -0.013976671732962132, -0.01355065405368805, -0.013124637305736542, -0.012698620557785034, -0.012272601947188377, -0.01184658519923687, -0.011420567519962788, -0.01099455077201128, -0.010568534024059772, -0.01014251634478569, -0.009716499596834183, -0.009290482848882675, -0.008864466100931168, -0.00843844935297966, -0.008012431673705578, -0.00758641492575407, -0.007160398177802563, -0.006734380964189768, -0.006308363750576973, -0.005882347002625465, -0.005456330254673958, -0.005030313041061163, -0.004604296293109655, -0.0041782790794968605, -0.003752262331545353, -0.003326245117932558, -0.002900228137150407, -0.0024742111563682556, -0.0020481941755861044, -0.0016221771948039532, -0.001196160214021802, -0.0007701431168243289, -0.0003441261360421777, 8.189096115529537e-05, 0.0005079079419374466, 0.0009339249227195978, 0.001359941903501749]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 12.0, 8.0, 11.0, 20.0, 14.0, 41.0, 46.0, 60.0, 61.0, 74.0, 79.0, 85.0, 81.0, 68.0, 61.0, 64.0, 59.0, 39.0, 32.0, 27.0, 27.0, 15.0, 13.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008486509323120117, -0.0008117500692605972, -0.0007748492062091827, -0.0007379483431577682, -0.0007010474801063538, -0.0006641466170549393, -0.0006272457540035248, -0.0005903448909521103, -0.0005534440279006958, -0.0005165431648492813, -0.0004796423017978668, -0.00044274143874645233, -0.00040584057569503784, -0.00036893971264362335, -0.00033203884959220886, -0.00029513798654079437, -0.0002582371234893799, -0.0002213362604379654, -0.0001844353973865509, -0.00014753453433513641, -0.00011063367128372192, -7.373280823230743e-05, -3.6831945180892944e-05, 6.891787052154541e-08, 3.6969780921936035e-05, 7.387064397335052e-05, 0.00011077150702476501, 0.0001476723700761795, 0.000184573233127594, 0.00022147409617900848, 0.000258374959230423, 0.00029527582228183746, 0.00033217668533325195, 0.00036907754838466644, 0.00040597841143608093, 0.0004428792744874954, 0.0004797801375389099, 0.0005166810005903244, 0.0005535818636417389, 0.0005904827266931534, 0.0006273835897445679, 0.0006642844527959824, 0.0007011853158473969, 0.0007380861788988113, 0.0007749870419502258, 0.0008118879050016403, 0.0008487887680530548, 0.0008856896311044693, 0.0009225904941558838, 0.0009594913572072983, 0.0009963922202587128, 0.0010332930833101273, 0.0010701939463615417, 0.0011070948094129562, 0.0011439956724643707, 0.0011808965355157852, 0.0012177973985671997, 0.0012546982616186142, 0.0012915991246700287, 0.0013284999877214432, 0.0013654008507728577, 0.0014023017138242722, 0.0014392025768756866, 0.0014761034399271011, 0.0015130043029785156]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 8.0, 5.0, 6.0, 10.0, 17.0, 11.0, 9.0, 16.0, 21.0, 20.0, 30.0, 29.0, 35.0, 39.0, 33.0, 41.0, 39.0, 55.0, 34.0, 38.0, 43.0, 49.0, 48.0, 46.0, 32.0, 36.0, 34.0, 25.0, 32.0, 28.0, 24.0, 19.0, 10.0, 16.0, 7.0, 11.0, 12.0, 6.0, 9.0, 3.0, 5.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0], "bins": [-9.5546875, -9.28680419921875, -9.0189208984375, -8.75103759765625, -8.483154296875, -8.21527099609375, -7.9473876953125, -7.67950439453125, -7.41162109375, -7.14373779296875, -6.8758544921875, -6.60797119140625, -6.340087890625, -6.07220458984375, -5.8043212890625, -5.53643798828125, -5.2685546875, -5.00067138671875, -4.7327880859375, -4.46490478515625, -4.197021484375, -3.92913818359375, -3.6612548828125, -3.39337158203125, -3.12548828125, -2.85760498046875, -2.5897216796875, -2.32183837890625, -2.053955078125, -1.78607177734375, -1.5181884765625, -1.25030517578125, -0.982421875, -0.71453857421875, -0.4466552734375, -0.17877197265625, 0.089111328125, 0.35699462890625, 0.6248779296875, 0.89276123046875, 1.16064453125, 1.42852783203125, 1.6964111328125, 1.96429443359375, 2.232177734375, 2.50006103515625, 2.7679443359375, 3.03582763671875, 3.3037109375, 3.57159423828125, 3.8394775390625, 4.10736083984375, 4.375244140625, 4.64312744140625, 4.9110107421875, 5.17889404296875, 5.44677734375, 5.71466064453125, 5.9825439453125, 6.25042724609375, 6.518310546875, 6.78619384765625, 7.0540771484375, 7.32196044921875, 7.58984375]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 11.0, 2.0, 2.0, 9.0, 11.0, 7.0, 12.0, 22.0, 30.0, 54.0, 58.0, 74.0, 108.0, 144.0, 199.0, 315.0, 424.0, 593.0, 866.0, 1339.0, 2117.0, 3457.0, 5796.0, 11233.0, 25894.0, 183710.0, 739638.0, 39274.0, 14551.0, 7086.0, 4091.0, 2462.0, 1636.0, 1008.0, 668.0, 522.0, 348.0, 214.0, 159.0, 94.0, 94.0, 72.0, 48.0, 31.0, 16.0, 18.0, 16.0, 2.0, 9.0, 10.0, 8.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-17.765625, -17.135009765625, -16.50439453125, -15.873779296875, -15.2431640625, -14.612548828125, -13.98193359375, -13.351318359375, -12.720703125, -12.090087890625, -11.45947265625, -10.828857421875, -10.1982421875, -9.567626953125, -8.93701171875, -8.306396484375, -7.67578125, -7.045166015625, -6.41455078125, -5.783935546875, -5.1533203125, -4.522705078125, -3.89208984375, -3.261474609375, -2.630859375, -2.000244140625, -1.36962890625, -0.739013671875, -0.1083984375, 0.522216796875, 1.15283203125, 1.783447265625, 2.4140625, 3.044677734375, 3.67529296875, 4.305908203125, 4.9365234375, 5.567138671875, 6.19775390625, 6.828369140625, 7.458984375, 8.089599609375, 8.72021484375, 9.350830078125, 9.9814453125, 10.612060546875, 11.24267578125, 11.873291015625, 12.50390625, 13.134521484375, 13.76513671875, 14.395751953125, 15.0263671875, 15.656982421875, 16.28759765625, 16.918212890625, 17.548828125, 18.179443359375, 18.81005859375, 19.440673828125, 20.0712890625, 20.701904296875, 21.33251953125, 21.963134765625, 22.59375]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 9.0, 4.0, 10.0, 12.0, 12.0, 18.0, 19.0, 12.0, 16.0, 24.0, 32.0, 24.0, 33.0, 41.0, 47.0, 52.0, 63.0, 102.0, 195.0, 1676.0, 104.0, 85.0, 56.0, 51.0, 51.0, 41.0, 35.0, 32.0, 24.0, 30.0, 26.0, 17.0, 16.0, 16.0, 15.0, 13.0, 5.0, 7.0, 4.0, 5.0, 1.0, 5.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.671875, -26.785400390625, -25.89892578125, -25.012451171875, -24.1259765625, -23.239501953125, -22.35302734375, -21.466552734375, -20.580078125, -19.693603515625, -18.80712890625, -17.920654296875, -17.0341796875, -16.147705078125, -15.26123046875, -14.374755859375, -13.48828125, -12.601806640625, -11.71533203125, -10.828857421875, -9.9423828125, -9.055908203125, -8.16943359375, -7.282958984375, -6.396484375, -5.510009765625, -4.62353515625, -3.737060546875, -2.8505859375, -1.964111328125, -1.07763671875, -0.191162109375, 0.6953125, 1.581787109375, 2.46826171875, 3.354736328125, 4.2412109375, 5.127685546875, 6.01416015625, 6.900634765625, 7.787109375, 8.673583984375, 9.56005859375, 10.446533203125, 11.3330078125, 12.219482421875, 13.10595703125, 13.992431640625, 14.87890625, 15.765380859375, 16.65185546875, 17.538330078125, 18.4248046875, 19.311279296875, 20.19775390625, 21.084228515625, 21.970703125, 22.857177734375, 23.74365234375, 24.630126953125, 25.5166015625, 26.403076171875, 27.28955078125, 28.176025390625, 29.0625]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 4.0, 3.0, 4.0, 3.0, 6.0, 8.0, 8.0, 13.0, 16.0, 17.0, 26.0, 38.0, 42.0, 51.0, 55.0, 95.0, 130.0, 190.0, 445.0, 1245.0, 5268.0, 31459.0, 2813722.0, 271290.0, 16682.0, 3204.0, 841.0, 291.0, 159.0, 95.0, 77.0, 64.0, 35.0, 20.0, 16.0, 15.0, 11.0, 15.0, 13.0, 8.0, 9.0, 7.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.0, -56.23388671875, -54.4677734375, -52.70166015625, -50.935546875, -49.16943359375, -47.4033203125, -45.63720703125, -43.87109375, -42.10498046875, -40.3388671875, -38.57275390625, -36.806640625, -35.04052734375, -33.2744140625, -31.50830078125, -29.7421875, -27.97607421875, -26.2099609375, -24.44384765625, -22.677734375, -20.91162109375, -19.1455078125, -17.37939453125, -15.61328125, -13.84716796875, -12.0810546875, -10.31494140625, -8.548828125, -6.78271484375, -5.0166015625, -3.25048828125, -1.484375, 0.28173828125, 2.0478515625, 3.81396484375, 5.580078125, 7.34619140625, 9.1123046875, 10.87841796875, 12.64453125, 14.41064453125, 16.1767578125, 17.94287109375, 19.708984375, 21.47509765625, 23.2412109375, 25.00732421875, 26.7734375, 28.53955078125, 30.3056640625, 32.07177734375, 33.837890625, 35.60400390625, 37.3701171875, 39.13623046875, 40.90234375, 42.66845703125, 44.4345703125, 46.20068359375, 47.966796875, 49.73291015625, 51.4990234375, 53.26513671875, 55.03125]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 10.0, 228.0, 721.0, 54.0, 3.0, 1.0, 1.0], "bins": [-819.880126953125, -806.0418090820312, -792.2034912109375, -778.3651733398438, -764.5269165039062, -750.6885986328125, -736.8502807617188, -723.011962890625, -709.1736450195312, -695.3353271484375, -681.4970092773438, -667.65869140625, -653.8204345703125, -639.9821166992188, -626.143798828125, -612.3054809570312, -598.4671630859375, -584.6288452148438, -570.79052734375, -556.9522094726562, -543.1139526367188, -529.275634765625, -515.4373168945312, -501.5989990234375, -487.7607116699219, -473.9223937988281, -460.0841064453125, -446.24578857421875, -432.407470703125, -418.56915283203125, -404.7308654785156, -390.8925476074219, -377.05419921875, -363.21588134765625, -349.3775939941406, -335.5392761230469, -321.7009582519531, -307.8626708984375, -294.02435302734375, -280.18603515625, -266.34771728515625, -252.50941467285156, -238.6710968017578, -224.83279418945312, -210.99447631835938, -197.1561737060547, -183.31787109375, -169.47955322265625, -155.64126586914062, -141.80296325683594, -127.96464538574219, -114.1263427734375, -100.28802490234375, -86.44972229003906, -72.61141204833984, -58.773101806640625, -44.934783935546875, -31.096473693847656, -17.25816535949707, -3.4198570251464844, 10.418453216552734, 24.256759643554688, 38.095069885253906, 51.933380126953125, 65.77169036865234]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 7.0, 3.0, 7.0, 10.0, 8.0, 18.0, 27.0, 18.0, 16.0, 21.0, 32.0, 36.0, 41.0, 29.0, 28.0, 37.0, 37.0, 37.0, 33.0, 47.0, 53.0, 40.0, 33.0, 42.0, 36.0, 33.0, 35.0, 32.0, 24.0, 21.0, 26.0, 15.0, 23.0, 15.0, 11.0, 12.0, 10.0, 7.0, 5.0, 6.0, 11.0, 7.0, 5.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-75.90670776367188, -73.55231475830078, -71.19792175292969, -68.84353637695312, -66.48914337158203, -64.13475036621094, -61.78036117553711, -59.42597198486328, -57.07157897949219, -54.717185974121094, -52.362796783447266, -50.00840759277344, -47.654014587402344, -45.29962158203125, -42.94523239135742, -40.590843200683594, -38.2364501953125, -35.882057189941406, -33.52766799926758, -31.173276901245117, -28.818885803222656, -26.464494705200195, -24.110103607177734, -21.755712509155273, -19.401321411132812, -17.04693031311035, -14.69253921508789, -12.33814811706543, -9.983757019042969, -7.629365921020508, -5.274974822998047, -2.920583724975586, -0.5661849975585938, 1.7882061004638672, 4.142597198486328, 6.496988296508789, 8.85137939453125, 11.205770492553711, 13.560161590576172, 15.914552688598633, 18.268943786621094, 20.623334884643555, 22.977725982666016, 25.332117080688477, 27.686508178710938, 30.0408992767334, 32.39529037475586, 34.74967956542969, 37.10407257080078, 39.458465576171875, 41.8128547668457, 44.16724395751953, 46.521636962890625, 48.87602996826172, 51.23041915893555, 53.584808349609375, 55.93920135498047, 58.29359436035156, 60.64798355102539, 63.00237274169922, 65.35676574707031, 67.7111587524414, 70.0655517578125, 72.41993713378906, 74.77433013916016]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 9.0, 3.0, 7.0, 11.0, 11.0, 7.0, 15.0, 12.0, 23.0, 19.0, 21.0, 33.0, 28.0, 32.0, 43.0, 35.0, 39.0, 28.0, 55.0, 32.0, 48.0, 33.0, 60.0, 29.0, 41.0, 33.0, 33.0, 34.0, 38.0, 29.0, 24.0, 16.0, 21.0, 16.0, 14.0, 9.0, 10.0, 9.0, 12.0, 4.0, 8.0, 6.0, 2.0, 2.0, 1.0, 5.0, 2.0, 1.0], "bins": [-9.75, -9.4827880859375, -9.215576171875, -8.9483642578125, -8.68115234375, -8.4139404296875, -8.146728515625, -7.8795166015625, -7.6123046875, -7.3450927734375, -7.077880859375, -6.8106689453125, -6.54345703125, -6.2762451171875, -6.009033203125, -5.7418212890625, -5.474609375, -5.2073974609375, -4.940185546875, -4.6729736328125, -4.40576171875, -4.1385498046875, -3.871337890625, -3.6041259765625, -3.3369140625, -3.0697021484375, -2.802490234375, -2.5352783203125, -2.26806640625, -2.0008544921875, -1.733642578125, -1.4664306640625, -1.19921875, -0.9320068359375, -0.664794921875, -0.3975830078125, -0.13037109375, 0.1368408203125, 0.404052734375, 0.6712646484375, 0.9384765625, 1.2056884765625, 1.472900390625, 1.7401123046875, 2.00732421875, 2.2745361328125, 2.541748046875, 2.8089599609375, 3.076171875, 3.3433837890625, 3.610595703125, 3.8778076171875, 4.14501953125, 4.4122314453125, 4.679443359375, 4.9466552734375, 5.2138671875, 5.4810791015625, 5.748291015625, 6.0155029296875, 6.28271484375, 6.5499267578125, 6.817138671875, 7.0843505859375, 7.3515625]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 10.0, 4.0, 11.0, 15.0, 15.0, 12.0, 22.0, 34.0, 57.0, 68.0, 96.0, 182.0, 251.0, 438.0, 821.0, 1523.0, 3208.0, 7767.0, 23776.0, 437568.0, 3552986.0, 137312.0, 16442.0, 6118.0, 2630.0, 1255.0, 663.0, 381.0, 211.0, 120.0, 91.0, 47.0, 38.0, 25.0, 12.0, 14.0, 18.0, 8.0, 9.0, 6.0, 4.0, 3.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0], "bins": [-41.65625, -40.510498046875, -39.36474609375, -38.218994140625, -37.0732421875, -35.927490234375, -34.78173828125, -33.635986328125, -32.490234375, -31.344482421875, -30.19873046875, -29.052978515625, -27.9072265625, -26.761474609375, -25.61572265625, -24.469970703125, -23.32421875, -22.178466796875, -21.03271484375, -19.886962890625, -18.7412109375, -17.595458984375, -16.44970703125, -15.303955078125, -14.158203125, -13.012451171875, -11.86669921875, -10.720947265625, -9.5751953125, -8.429443359375, -7.28369140625, -6.137939453125, -4.9921875, -3.846435546875, -2.70068359375, -1.554931640625, -0.4091796875, 0.736572265625, 1.88232421875, 3.028076171875, 4.173828125, 5.319580078125, 6.46533203125, 7.611083984375, 8.7568359375, 9.902587890625, 11.04833984375, 12.194091796875, 13.33984375, 14.485595703125, 15.63134765625, 16.777099609375, 17.9228515625, 19.068603515625, 20.21435546875, 21.360107421875, 22.505859375, 23.651611328125, 24.79736328125, 25.943115234375, 27.0888671875, 28.234619140625, 29.38037109375, 30.526123046875, 31.671875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 1.0, 3.0, 5.0, 4.0, 4.0, 7.0, 4.0, 15.0, 12.0, 15.0, 17.0, 17.0, 24.0, 38.0, 53.0, 71.0, 132.0, 229.0, 444.0, 746.0, 794.0, 574.0, 324.0, 178.0, 100.0, 70.0, 48.0, 29.0, 27.0, 19.0, 14.0, 18.0, 8.0, 2.0, 3.0, 8.0, 1.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-25.015625, -24.2841796875, -23.552734375, -22.8212890625, -22.08984375, -21.3583984375, -20.626953125, -19.8955078125, -19.1640625, -18.4326171875, -17.701171875, -16.9697265625, -16.23828125, -15.5068359375, -14.775390625, -14.0439453125, -13.3125, -12.5810546875, -11.849609375, -11.1181640625, -10.38671875, -9.6552734375, -8.923828125, -8.1923828125, -7.4609375, -6.7294921875, -5.998046875, -5.2666015625, -4.53515625, -3.8037109375, -3.072265625, -2.3408203125, -1.609375, -0.8779296875, -0.146484375, 0.5849609375, 1.31640625, 2.0478515625, 2.779296875, 3.5107421875, 4.2421875, 4.9736328125, 5.705078125, 6.4365234375, 7.16796875, 7.8994140625, 8.630859375, 9.3623046875, 10.09375, 10.8251953125, 11.556640625, 12.2880859375, 13.01953125, 13.7509765625, 14.482421875, 15.2138671875, 15.9453125, 16.6767578125, 17.408203125, 18.1396484375, 18.87109375, 19.6025390625, 20.333984375, 21.0654296875, 21.796875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 3.0, 0.0, 3.0, 4.0, 3.0, 1.0, 6.0, 3.0, 3.0, 9.0, 14.0, 23.0, 30.0, 48.0, 81.0, 208.0, 443.0, 1143.0, 3506.0, 12403.0, 68974.0, 3424518.0, 638717.0, 32670.0, 7762.0, 2304.0, 775.0, 284.0, 132.0, 75.0, 39.0, 17.0, 20.0, 15.0, 11.0, 6.0, 8.0, 6.0, 5.0, 3.0, 2.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-55.0, -53.1552734375, -51.310546875, -49.4658203125, -47.62109375, -45.7763671875, -43.931640625, -42.0869140625, -40.2421875, -38.3974609375, -36.552734375, -34.7080078125, -32.86328125, -31.0185546875, -29.173828125, -27.3291015625, -25.484375, -23.6396484375, -21.794921875, -19.9501953125, -18.10546875, -16.2607421875, -14.416015625, -12.5712890625, -10.7265625, -8.8818359375, -7.037109375, -5.1923828125, -3.34765625, -1.5029296875, 0.341796875, 2.1865234375, 4.03125, 5.8759765625, 7.720703125, 9.5654296875, 11.41015625, 13.2548828125, 15.099609375, 16.9443359375, 18.7890625, 20.6337890625, 22.478515625, 24.3232421875, 26.16796875, 28.0126953125, 29.857421875, 31.7021484375, 33.546875, 35.3916015625, 37.236328125, 39.0810546875, 40.92578125, 42.7705078125, 44.615234375, 46.4599609375, 48.3046875, 50.1494140625, 51.994140625, 53.8388671875, 55.68359375, 57.5283203125, 59.373046875, 61.2177734375, 63.0625]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 7.0, 15.0, 40.0, 86.0, 210.0, 314.0, 184.0, 99.0, 24.0, 27.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-196.27145385742188, -189.37081909179688, -182.47018432617188, -175.56954956054688, -168.66891479492188, -161.76828002929688, -154.86764526367188, -147.96701049804688, -141.06637573242188, -134.16574096679688, -127.26510620117188, -120.36447143554688, -113.46383666992188, -106.56320190429688, -99.66256713867188, -92.76193237304688, -85.8613052368164, -78.9606704711914, -72.0600357055664, -65.1594009399414, -58.258766174316406, -51.35813522338867, -44.45750045776367, -37.55686569213867, -30.656230926513672, -23.755596160888672, -16.854961395263672, -9.954328536987305, -3.0536937713623047, 3.8469390869140625, 10.747573852539062, 17.648208618164062, 24.548843383789062, 31.449478149414062, 38.35011291503906, 45.25074768066406, 52.15138244628906, 59.0520133972168, 65.95265197753906, 72.85328674316406, 79.75392150878906, 86.65455627441406, 93.55519104003906, 100.45582580566406, 107.35646057128906, 114.25709533691406, 121.15773010253906, 128.05836486816406, 134.958984375, 141.859619140625, 148.76025390625, 155.660888671875, 162.5615234375, 169.462158203125, 176.36279296875, 183.263427734375, 190.1640625, 197.064697265625, 203.96533203125, 210.865966796875, 217.7666015625, 224.667236328125, 231.56787109375, 238.468505859375, 245.369140625]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 7.0, 11.0, 6.0, 10.0, 9.0, 7.0, 10.0, 17.0, 26.0, 30.0, 27.0, 28.0, 32.0, 30.0, 27.0, 36.0, 43.0, 42.0, 41.0, 38.0, 53.0, 38.0, 33.0, 44.0, 44.0, 43.0, 29.0, 22.0, 38.0, 25.0, 19.0, 15.0, 20.0, 23.0, 10.0, 13.0, 11.0, 14.0, 13.0, 3.0, 9.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-74.88423156738281, -72.79228210449219, -70.70033264160156, -68.60838317871094, -66.51644134521484, -64.42449188232422, -62.332542419433594, -60.24059295654297, -58.148643493652344, -56.05669403076172, -53.96474838256836, -51.872798919677734, -49.78084945678711, -47.68890380859375, -45.596954345703125, -43.5050048828125, -41.41305923461914, -39.321109771728516, -37.229164123535156, -35.13721466064453, -33.045265197753906, -30.953317642211914, -28.861370086669922, -26.769420623779297, -24.677473068237305, -22.585525512695312, -20.493576049804688, -18.401628494262695, -16.309680938720703, -14.217731475830078, -12.125783920288086, -10.033835411071777, -7.941886901855469, -5.84993839263916, -3.7579903602600098, -1.6660423278808594, 0.4259061813354492, 2.517854690551758, 4.60980224609375, 6.701750755310059, 8.793699264526367, 10.885647773742676, 12.977596282958984, 15.069543838500977, 17.16149139404297, 19.253440856933594, 21.345388412475586, 23.437335968017578, 25.529285430908203, 27.621232986450195, 29.71318244934082, 31.805130004882812, 33.89707946777344, 35.98902893066406, 38.08097457885742, 40.17292404174805, 42.264869689941406, 44.35681915283203, 46.44876480102539, 48.540714263916016, 50.63266372680664, 52.724609375, 54.816558837890625, 56.90850830078125, 59.000457763671875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 5.0, 5.0, 13.0, 10.0, 10.0, 12.0, 13.0, 18.0, 15.0, 22.0, 23.0, 28.0, 30.0, 21.0, 37.0, 38.0, 50.0, 42.0, 52.0, 50.0, 41.0, 47.0, 46.0, 36.0, 41.0, 32.0, 39.0, 24.0, 42.0, 15.0, 18.0, 23.0, 21.0, 10.0, 11.0, 8.0, 10.0, 9.0, 5.0, 7.0, 5.0, 3.0, 2.0, 3.0, 4.0, 1.0, 2.0], "bins": [-10.09375, -9.81988525390625, -9.5460205078125, -9.27215576171875, -8.998291015625, -8.72442626953125, -8.4505615234375, -8.17669677734375, -7.90283203125, -7.62896728515625, -7.3551025390625, -7.08123779296875, -6.807373046875, -6.53350830078125, -6.2596435546875, -5.98577880859375, -5.7119140625, -5.43804931640625, -5.1641845703125, -4.89031982421875, -4.616455078125, -4.34259033203125, -4.0687255859375, -3.79486083984375, -3.52099609375, -3.24713134765625, -2.9732666015625, -2.69940185546875, -2.425537109375, -2.15167236328125, -1.8778076171875, -1.60394287109375, -1.330078125, -1.05621337890625, -0.7823486328125, -0.50848388671875, -0.234619140625, 0.03924560546875, 0.3131103515625, 0.58697509765625, 0.86083984375, 1.13470458984375, 1.4085693359375, 1.68243408203125, 1.956298828125, 2.23016357421875, 2.5040283203125, 2.77789306640625, 3.0517578125, 3.32562255859375, 3.5994873046875, 3.87335205078125, 4.147216796875, 4.42108154296875, 4.6949462890625, 4.96881103515625, 5.24267578125, 5.51654052734375, 5.7904052734375, 6.06427001953125, 6.338134765625, 6.61199951171875, 6.8858642578125, 7.15972900390625, 7.43359375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 4.0, 1.0, 1.0, 7.0, 20.0, 17.0, 34.0, 47.0, 69.0, 93.0, 124.0, 181.0, 264.0, 393.0, 505.0, 738.0, 1009.0, 1464.0, 2066.0, 3055.0, 4376.0, 6269.0, 8951.0, 13424.0, 19406.0, 28473.0, 42531.0, 64072.0, 97826.0, 151342.0, 200244.0, 134636.0, 88194.0, 58135.0, 38539.0, 25528.0, 17286.0, 12057.0, 8230.0, 5719.0, 3911.0, 2701.0, 1952.0, 1444.0, 928.0, 693.0, 463.0, 328.0, 237.0, 154.0, 119.0, 88.0, 67.0, 40.0, 46.0, 28.0, 8.0, 13.0, 7.0, 2.0, 8.0, 3.0], "bins": [-0.1748046875, -0.1694049835205078, -0.16400527954101562, -0.15860557556152344, -0.15320587158203125, -0.14780616760253906, -0.14240646362304688, -0.1370067596435547, -0.1316070556640625, -0.1262073516845703, -0.12080764770507812, -0.11540794372558594, -0.11000823974609375, -0.10460853576660156, -0.09920883178710938, -0.09380912780761719, -0.088409423828125, -0.08300971984863281, -0.07761001586914062, -0.07221031188964844, -0.06681060791015625, -0.06141090393066406, -0.056011199951171875, -0.05061149597167969, -0.0452117919921875, -0.03981208801269531, -0.034412384033203125, -0.029012680053710938, -0.02361297607421875, -0.018213272094726562, -0.012813568115234375, -0.0074138641357421875, -0.00201416015625, 0.0033855438232421875, 0.008785247802734375, 0.014184951782226562, 0.01958465576171875, 0.024984359741210938, 0.030384063720703125, 0.03578376770019531, 0.0411834716796875, 0.04658317565917969, 0.051982879638671875, 0.05738258361816406, 0.06278228759765625, 0.06818199157714844, 0.07358169555664062, 0.07898139953613281, 0.084381103515625, 0.08978080749511719, 0.09518051147460938, 0.10058021545410156, 0.10597991943359375, 0.11137962341308594, 0.11677932739257812, 0.12217903137207031, 0.1275787353515625, 0.1329784393310547, 0.13837814331054688, 0.14377784729003906, 0.14917755126953125, 0.15457725524902344, 0.15997695922851562, 0.1653766632080078, 0.1707763671875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 3.0, 5.0, 3.0, 7.0, 4.0, 10.0, 15.0, 13.0, 17.0, 18.0, 25.0, 32.0, 25.0, 28.0, 31.0, 41.0, 42.0, 35.0, 51.0, 48.0, 1069.0, 42.0, 55.0, 38.0, 43.0, 39.0, 49.0, 35.0, 31.0, 31.0, 30.0, 13.0, 19.0, 22.0, 15.0, 12.0, 7.0, 11.0, 4.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.078125, -5.85986328125, -5.6416015625, -5.42333984375, -5.205078125, -4.98681640625, -4.7685546875, -4.55029296875, -4.33203125, -4.11376953125, -3.8955078125, -3.67724609375, -3.458984375, -3.24072265625, -3.0224609375, -2.80419921875, -2.5859375, -2.36767578125, -2.1494140625, -1.93115234375, -1.712890625, -1.49462890625, -1.2763671875, -1.05810546875, -0.83984375, -0.62158203125, -0.4033203125, -0.18505859375, 0.033203125, 0.25146484375, 0.4697265625, 0.68798828125, 0.90625, 1.12451171875, 1.3427734375, 1.56103515625, 1.779296875, 1.99755859375, 2.2158203125, 2.43408203125, 2.65234375, 2.87060546875, 3.0888671875, 3.30712890625, 3.525390625, 3.74365234375, 3.9619140625, 4.18017578125, 4.3984375, 4.61669921875, 4.8349609375, 5.05322265625, 5.271484375, 5.48974609375, 5.7080078125, 5.92626953125, 6.14453125, 6.36279296875, 6.5810546875, 6.79931640625, 7.017578125, 7.23583984375, 7.4541015625, 7.67236328125, 7.890625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 17.0, 7.0, 20.0, 31.0, 38.0, 83.0, 112.0, 166.0, 242.0, 401.0, 580.0, 948.0, 1546.0, 2628.0, 4222.0, 6810.0, 11519.0, 18829.0, 31381.0, 52477.0, 87954.0, 150086.0, 1282605.0, 181280.0, 105781.0, 62148.0, 37637.0, 22703.0, 13740.0, 8270.0, 4869.0, 3094.0, 1859.0, 1127.0, 695.0, 425.0, 293.0, 170.0, 121.0, 74.0, 51.0, 35.0, 19.0, 16.0, 10.0, 10.0, 4.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1103515625, -0.10686779022216797, -0.10338401794433594, -0.0999002456665039, -0.09641647338867188, -0.09293270111083984, -0.08944892883300781, -0.08596515655517578, -0.08248138427734375, -0.07899761199951172, -0.07551383972167969, -0.07203006744384766, -0.06854629516601562, -0.0650625228881836, -0.06157875061035156, -0.05809497833251953, -0.0546112060546875, -0.05112743377685547, -0.04764366149902344, -0.044159889221191406, -0.040676116943359375, -0.037192344665527344, -0.03370857238769531, -0.03022480010986328, -0.02674102783203125, -0.02325725555419922, -0.019773483276367188, -0.016289710998535156, -0.012805938720703125, -0.009322166442871094, -0.0058383941650390625, -0.0023546218872070312, 0.001129150390625, 0.004612922668457031, 0.008096694946289062, 0.011580467224121094, 0.015064239501953125, 0.018548011779785156, 0.022031784057617188, 0.02551555633544922, 0.02899932861328125, 0.03248310089111328, 0.03596687316894531, 0.039450645446777344, 0.042934417724609375, 0.046418190002441406, 0.04990196228027344, 0.05338573455810547, 0.0568695068359375, 0.06035327911376953, 0.06383705139160156, 0.0673208236694336, 0.07080459594726562, 0.07428836822509766, 0.07777214050292969, 0.08125591278076172, 0.08473968505859375, 0.08822345733642578, 0.09170722961425781, 0.09519100189208984, 0.09867477416992188, 0.1021585464477539, 0.10564231872558594, 0.10912609100341797, 0.11260986328125]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 4.0, 4.0, 6.0, 10.0, 5.0, 6.0, 20.0, 16.0, 32.0, 24.0, 32.0, 34.0, 32.0, 45.0, 49.0, 51.0, 46.0, 50.0, 59.0, 53.0, 47.0, 56.0, 40.0, 30.0, 42.0, 29.0, 31.0, 16.0, 26.0, 16.0, 17.0, 17.0, 9.0, 12.0, 4.0, 7.0, 5.0, 4.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0008707046508789062, -0.000844612717628479, -0.0008185207843780518, -0.0007924288511276245, -0.0007663369178771973, -0.00074024498462677, -0.0007141530513763428, -0.0006880611181259155, -0.0006619691848754883, -0.000635877251625061, -0.0006097853183746338, -0.0005836933851242065, -0.0005576014518737793, -0.000531509518623352, -0.0005054175853729248, -0.00047932565212249756, -0.0004532337188720703, -0.00042714178562164307, -0.0004010498523712158, -0.0003749579191207886, -0.00034886598587036133, -0.0003227740526199341, -0.00029668211936950684, -0.0002705901861190796, -0.00024449825286865234, -0.0002184063196182251, -0.00019231438636779785, -0.0001662224531173706, -0.00014013051986694336, -0.00011403858661651611, -8.794665336608887e-05, -6.185472011566162e-05, -3.5762786865234375e-05, -9.670853614807129e-06, 1.6421079635620117e-05, 4.251301288604736e-05, 6.860494613647461e-05, 9.469687938690186e-05, 0.0001207888126373291, 0.00014688074588775635, 0.0001729726791381836, 0.00019906461238861084, 0.00022515654563903809, 0.00025124847888946533, 0.0002773404121398926, 0.0003034323453903198, 0.00032952427864074707, 0.0003556162118911743, 0.00038170814514160156, 0.0004078000783920288, 0.00043389201164245605, 0.0004599839448928833, 0.00048607587814331055, 0.0005121678113937378, 0.000538259744644165, 0.0005643516778945923, 0.0005904436111450195, 0.0006165355443954468, 0.000642627477645874, 0.0006687194108963013, 0.0006948113441467285, 0.0007209032773971558, 0.000746995210647583, 0.0007730871438980103, 0.0007991790771484375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 5.0, 7.0, 5.0, 11.0, 13.0, 19.0, 24.0, 16.0, 39.0, 31.0, 45.0, 72.0, 88.0, 135.0, 273.0, 415.0, 882.0, 7228.0, 985463.0, 50863.0, 1447.0, 498.0, 285.0, 204.0, 133.0, 95.0, 56.0, 51.0, 44.0, 26.0, 17.0, 10.0, 10.0, 9.0, 6.0, 5.0, 4.0, 6.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.01458740234375, -0.014112234115600586, -0.013637065887451172, -0.013161897659301758, -0.012686729431152344, -0.01221156120300293, -0.011736392974853516, -0.011261224746704102, -0.010786056518554688, -0.010310888290405273, -0.00983572006225586, -0.009360551834106445, -0.008885383605957031, -0.008410215377807617, -0.007935047149658203, -0.007459878921508789, -0.006984710693359375, -0.006509542465209961, -0.006034374237060547, -0.005559206008911133, -0.005084037780761719, -0.004608869552612305, -0.004133701324462891, -0.0036585330963134766, -0.0031833648681640625, -0.0027081966400146484, -0.0022330284118652344, -0.0017578601837158203, -0.0012826919555664062, -0.0008075237274169922, -0.0003323554992675781, 0.00014281272888183594, 0.00061798095703125, 0.001093149185180664, 0.0015683174133300781, 0.002043485641479492, 0.0025186538696289062, 0.0029938220977783203, 0.0034689903259277344, 0.0039441585540771484, 0.0044193267822265625, 0.0048944950103759766, 0.005369663238525391, 0.005844831466674805, 0.006319999694824219, 0.006795167922973633, 0.007270336151123047, 0.007745504379272461, 0.008220672607421875, 0.008695840835571289, 0.009171009063720703, 0.009646177291870117, 0.010121345520019531, 0.010596513748168945, 0.01107168197631836, 0.011546850204467773, 0.012022018432617188, 0.012497186660766602, 0.012972354888916016, 0.01344752311706543, 0.013922691345214844, 0.014397859573364258, 0.014873027801513672, 0.015348196029663086, 0.0158233642578125]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 6.0, 105.0, 876.0, 28.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.017937416210770607, -0.017613166943192482, -0.017288919538259506, -0.01696467027068138, -0.016640421003103256, -0.01631617359817028, -0.015991924330592155, -0.01566767506301403, -0.01534342672675848, -0.01501917839050293, -0.014694929122924805, -0.014370680786669254, -0.014046432450413704, -0.013722183182835579, -0.013397934846580029, -0.013073686510324478, -0.012749437242746353, -0.012425188906490803, -0.012100939638912678, -0.011776691302657127, -0.011452442035079002, -0.011128193698823452, -0.010803945362567902, -0.010479696094989777, -0.010155447758734226, -0.009831199422478676, -0.00950695015490055, -0.009182701818645, -0.00885845348238945, -0.008534204214811325, -0.008209955878555775, -0.007885707542300224, -0.007561459206044674, -0.007237210404127836, -0.0069129616022109985, -0.006588713265955448, -0.0062644644640386105, -0.005940215662121773, -0.005615967325866222, -0.005291718523949385, -0.004967469722032547, -0.004643220920115709, -0.004318972118198872, -0.003994723781943321, -0.0036704749800264835, -0.003346226178109646, -0.003021977609023452, -0.0026977290399372578, -0.0023734800051897764, -0.0020492314361035824, -0.0017249826341867447, -0.0014007339486852288, -0.001076485263183713, -0.0007522365776821971, -0.00042798789218068123, -0.00010373932309448719, 0.0002205094788223505, 0.0005447581643238664, 0.0008690068498253822, 0.001193255535326898, 0.001517504220828414, 0.0018417529063299298, 0.0021660015918314457, 0.0024902501609176397, 0.0028144989628344774]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 5.0, 8.0, 14.0, 16.0, 16.0, 29.0, 17.0, 28.0, 31.0, 42.0, 40.0, 52.0, 39.0, 45.0, 40.0, 58.0, 48.0, 45.0, 48.0, 54.0, 63.0, 46.0, 46.0, 34.0, 22.0, 21.0, 20.0, 12.0, 13.0, 11.0, 14.0, 9.0, 6.0, 4.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00109100341796875, -0.0010572606697678566, -0.0010235179215669632, -0.0009897751733660698, -0.0009560324251651764, -0.000922289676964283, -0.0008885469287633896, -0.0008548041805624962, -0.0008210614323616028, -0.0007873186841607094, -0.000753575935959816, -0.0007198331877589226, -0.0006860904395580292, -0.0006523476913571358, -0.0006186049431562424, -0.000584862194955349, -0.0005511194467544556, -0.0005173766985535622, -0.00048363395035266876, -0.00044989120215177536, -0.00041614845395088196, -0.00038240570574998856, -0.00034866295754909515, -0.00031492020934820175, -0.00028117746114730835, -0.00024743471294641495, -0.00021369196474552155, -0.00017994921654462814, -0.00014620646834373474, -0.00011246372014284134, -7.872097194194794e-05, -4.4978223741054535e-05, -1.1235475540161133e-05, 2.250727266073227e-05, 5.625002086162567e-05, 8.999276906251907e-05, 0.00012373551726341248, 0.00015747826546430588, 0.00019122101366519928, 0.00022496376186609268, 0.0002587065100669861, 0.0002924492582678795, 0.0003261920064687729, 0.0003599347546696663, 0.0003936775028705597, 0.0004274202510714531, 0.0004611629992723465, 0.0004949057474732399, 0.0005286484956741333, 0.0005623912438750267, 0.0005961339920759201, 0.0006298767402768135, 0.0006636194884777069, 0.0006973622366786003, 0.0007311049848794937, 0.0007648477330803871, 0.0007985904812812805, 0.0008323332294821739, 0.0008660759776830673, 0.0008998187258839607, 0.0009335614740848541, 0.0009673042222857475, 0.001001046970486641, 0.0010347897186875343, 0.0010685324668884277]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 5.0, 5.0, 13.0, 10.0, 10.0, 12.0, 13.0, 18.0, 15.0, 22.0, 23.0, 28.0, 30.0, 21.0, 37.0, 38.0, 50.0, 42.0, 52.0, 50.0, 41.0, 47.0, 46.0, 36.0, 41.0, 32.0, 39.0, 24.0, 42.0, 15.0, 18.0, 23.0, 21.0, 10.0, 11.0, 8.0, 10.0, 9.0, 5.0, 7.0, 5.0, 3.0, 2.0, 3.0, 4.0, 1.0, 2.0], "bins": [-10.09375, -9.81988525390625, -9.5460205078125, -9.27215576171875, -8.998291015625, -8.72442626953125, -8.4505615234375, -8.17669677734375, -7.90283203125, -7.62896728515625, -7.3551025390625, -7.08123779296875, -6.807373046875, -6.53350830078125, -6.2596435546875, -5.98577880859375, -5.7119140625, -5.43804931640625, -5.1641845703125, -4.89031982421875, -4.616455078125, -4.34259033203125, -4.0687255859375, -3.79486083984375, -3.52099609375, -3.24713134765625, -2.9732666015625, -2.69940185546875, -2.425537109375, -2.15167236328125, -1.8778076171875, -1.60394287109375, -1.330078125, -1.05621337890625, -0.7823486328125, -0.50848388671875, -0.234619140625, 0.03924560546875, 0.3131103515625, 0.58697509765625, 0.86083984375, 1.13470458984375, 1.4085693359375, 1.68243408203125, 1.956298828125, 2.23016357421875, 2.5040283203125, 2.77789306640625, 3.0517578125, 3.32562255859375, 3.5994873046875, 3.87335205078125, 4.147216796875, 4.42108154296875, 4.6949462890625, 4.96881103515625, 5.24267578125, 5.51654052734375, 5.7904052734375, 6.06427001953125, 6.338134765625, 6.61199951171875, 6.8858642578125, 7.15972900390625, 7.43359375]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 8.0, 2.0, 3.0, 6.0, 17.0, 12.0, 29.0, 30.0, 39.0, 49.0, 79.0, 101.0, 141.0, 187.0, 277.0, 410.0, 602.0, 999.0, 1652.0, 2833.0, 5441.0, 12591.0, 40454.0, 603973.0, 321894.0, 33530.0, 11141.0, 5022.0, 2613.0, 1537.0, 946.0, 615.0, 412.0, 297.0, 171.0, 132.0, 81.0, 72.0, 41.0, 28.0, 24.0, 13.0, 13.0, 15.0, 8.0, 3.0, 9.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.203125, -23.36669921875, -22.5302734375, -21.69384765625, -20.857421875, -20.02099609375, -19.1845703125, -18.34814453125, -17.51171875, -16.67529296875, -15.8388671875, -15.00244140625, -14.166015625, -13.32958984375, -12.4931640625, -11.65673828125, -10.8203125, -9.98388671875, -9.1474609375, -8.31103515625, -7.474609375, -6.63818359375, -5.8017578125, -4.96533203125, -4.12890625, -3.29248046875, -2.4560546875, -1.61962890625, -0.783203125, 0.05322265625, 0.8896484375, 1.72607421875, 2.5625, 3.39892578125, 4.2353515625, 5.07177734375, 5.908203125, 6.74462890625, 7.5810546875, 8.41748046875, 9.25390625, 10.09033203125, 10.9267578125, 11.76318359375, 12.599609375, 13.43603515625, 14.2724609375, 15.10888671875, 15.9453125, 16.78173828125, 17.6181640625, 18.45458984375, 19.291015625, 20.12744140625, 20.9638671875, 21.80029296875, 22.63671875, 23.47314453125, 24.3095703125, 25.14599609375, 25.982421875, 26.81884765625, 27.6552734375, 28.49169921875, 29.328125]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 5.0, 8.0, 3.0, 5.0, 7.0, 8.0, 5.0, 11.0, 10.0, 19.0, 27.0, 19.0, 36.0, 29.0, 36.0, 34.0, 45.0, 45.0, 51.0, 98.0, 171.0, 1685.0, 175.0, 88.0, 64.0, 34.0, 47.0, 36.0, 38.0, 40.0, 31.0, 29.0, 16.0, 19.0, 24.0, 9.0, 16.0, 8.0, 6.0, 4.0, 5.0, 2.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.09375, -33.07666015625, -32.0595703125, -31.04248046875, -30.025390625, -29.00830078125, -27.9912109375, -26.97412109375, -25.95703125, -24.93994140625, -23.9228515625, -22.90576171875, -21.888671875, -20.87158203125, -19.8544921875, -18.83740234375, -17.8203125, -16.80322265625, -15.7861328125, -14.76904296875, -13.751953125, -12.73486328125, -11.7177734375, -10.70068359375, -9.68359375, -8.66650390625, -7.6494140625, -6.63232421875, -5.615234375, -4.59814453125, -3.5810546875, -2.56396484375, -1.546875, -0.52978515625, 0.4873046875, 1.50439453125, 2.521484375, 3.53857421875, 4.5556640625, 5.57275390625, 6.58984375, 7.60693359375, 8.6240234375, 9.64111328125, 10.658203125, 11.67529296875, 12.6923828125, 13.70947265625, 14.7265625, 15.74365234375, 16.7607421875, 17.77783203125, 18.794921875, 19.81201171875, 20.8291015625, 21.84619140625, 22.86328125, 23.88037109375, 24.8974609375, 25.91455078125, 26.931640625, 27.94873046875, 28.9658203125, 29.98291015625, 31.0]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 6.0, 5.0, 3.0, 6.0, 6.0, 3.0, 12.0, 6.0, 17.0, 14.0, 31.0, 37.0, 30.0, 39.0, 104.0, 133.0, 281.0, 532.0, 1206.0, 3287.0, 11054.0, 77604.0, 2945764.0, 87569.0, 11888.0, 3543.0, 1342.0, 528.0, 235.0, 117.0, 81.0, 54.0, 37.0, 33.0, 25.0, 11.0, 17.0, 11.0, 10.0, 8.0, 7.0, 7.0, 3.0, 4.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-50.4375, -48.6689453125, -46.900390625, -45.1318359375, -43.36328125, -41.5947265625, -39.826171875, -38.0576171875, -36.2890625, -34.5205078125, -32.751953125, -30.9833984375, -29.21484375, -27.4462890625, -25.677734375, -23.9091796875, -22.140625, -20.3720703125, -18.603515625, -16.8349609375, -15.06640625, -13.2978515625, -11.529296875, -9.7607421875, -7.9921875, -6.2236328125, -4.455078125, -2.6865234375, -0.91796875, 0.8505859375, 2.619140625, 4.3876953125, 6.15625, 7.9248046875, 9.693359375, 11.4619140625, 13.23046875, 14.9990234375, 16.767578125, 18.5361328125, 20.3046875, 22.0732421875, 23.841796875, 25.6103515625, 27.37890625, 29.1474609375, 30.916015625, 32.6845703125, 34.453125, 36.2216796875, 37.990234375, 39.7587890625, 41.52734375, 43.2958984375, 45.064453125, 46.8330078125, 48.6015625, 50.3701171875, 52.138671875, 53.9072265625, 55.67578125, 57.4443359375, 59.212890625, 60.9814453125, 62.75]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 41.0, 905.0, 74.0, 0.0, 1.0], "bins": [-1604.9996337890625, -1578.48681640625, -1551.973876953125, -1525.4610595703125, -1498.9482421875, -1472.435302734375, -1445.9224853515625, -1419.40966796875, -1392.896728515625, -1366.3839111328125, -1339.8709716796875, -1313.358154296875, -1286.8453369140625, -1260.3323974609375, -1233.819580078125, -1207.3067626953125, -1180.7939453125, -1154.2811279296875, -1127.7681884765625, -1101.25537109375, -1074.7425537109375, -1048.2296142578125, -1021.716796875, -995.2039794921875, -968.6910400390625, -942.1781616210938, -915.6653442382812, -889.1524658203125, -862.6395874023438, -836.1267700195312, -809.6138916015625, -783.10107421875, -756.5881958007812, -730.0753173828125, -703.5625, -677.0496215820312, -650.5367431640625, -624.02392578125, -597.5110473632812, -570.9981689453125, -544.4853515625, -517.9724731445312, -491.4596252441406, -464.94677734375, -438.4339294433594, -411.92108154296875, -385.408203125, -358.8953552246094, -332.3824768066406, -305.86962890625, -279.35675048828125, -252.84390258789062, -226.3310546875, -199.8181915283203, -173.30532836914062, -146.79248046875, -120.27960968017578, -93.76675415039062, -67.25389099121094, -40.74103546142578, -14.228179931640625, 12.284675598144531, 38.79753875732422, 65.31038665771484, 91.82324981689453]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 4.0, 6.0, 5.0, 4.0, 12.0, 13.0, 13.0, 26.0, 14.0, 19.0, 21.0, 27.0, 23.0, 37.0, 28.0, 40.0, 42.0, 29.0, 41.0, 22.0, 38.0, 32.0, 43.0, 49.0, 45.0, 31.0, 37.0, 34.0, 26.0, 23.0, 31.0, 29.0, 23.0, 20.0, 16.0, 14.0, 16.0, 15.0, 8.0, 8.0, 6.0, 5.0, 9.0, 8.0, 1.0, 4.0, 5.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.74593353271484, -77.18772888183594, -74.62952423095703, -72.07131958007812, -69.51311492919922, -66.95491027832031, -64.3967056274414, -61.8385009765625, -59.280296325683594, -56.72209167480469, -54.16388702392578, -51.605682373046875, -49.04747772216797, -46.48927307128906, -43.931068420410156, -41.37286376953125, -38.814659118652344, -36.25645446777344, -33.69824981689453, -31.140045166015625, -28.58184051513672, -26.023635864257812, -23.465431213378906, -20.9072265625, -18.349021911621094, -15.790817260742188, -13.232612609863281, -10.674407958984375, -8.116203308105469, -5.5579986572265625, -2.9997940063476562, -0.44158935546875, 2.116607666015625, 4.674812316894531, 7.2330169677734375, 9.791221618652344, 12.34942626953125, 14.907630920410156, 17.465835571289062, 20.02404022216797, 22.582244873046875, 25.14044952392578, 27.698654174804688, 30.256858825683594, 32.8150634765625, 35.373268127441406, 37.93147277832031, 40.48967742919922, 43.047882080078125, 45.60608673095703, 48.16429138183594, 50.722496032714844, 53.28070068359375, 55.838905334472656, 58.39710998535156, 60.95531463623047, 63.513519287109375, 66.07172393798828, 68.62992858886719, 71.1881332397461, 73.746337890625, 76.3045425415039, 78.86274719238281, 81.42095184326172, 83.97915649414062]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 6.0, 4.0, 6.0, 10.0, 9.0, 9.0, 8.0, 13.0, 13.0, 17.0, 21.0, 17.0, 19.0, 39.0, 29.0, 35.0, 23.0, 49.0, 43.0, 52.0, 40.0, 33.0, 50.0, 46.0, 40.0, 48.0, 43.0, 36.0, 33.0, 27.0, 30.0, 21.0, 16.0, 24.0, 18.0, 10.0, 11.0, 11.0, 11.0, 3.0, 11.0, 6.0, 3.0, 4.0, 4.0, 3.0, 0.0, 2.0], "bins": [-11.0859375, -10.7911376953125, -10.496337890625, -10.2015380859375, -9.90673828125, -9.6119384765625, -9.317138671875, -9.0223388671875, -8.7275390625, -8.4327392578125, -8.137939453125, -7.8431396484375, -7.54833984375, -7.2535400390625, -6.958740234375, -6.6639404296875, -6.369140625, -6.0743408203125, -5.779541015625, -5.4847412109375, -5.18994140625, -4.8951416015625, -4.600341796875, -4.3055419921875, -4.0107421875, -3.7159423828125, -3.421142578125, -3.1263427734375, -2.83154296875, -2.5367431640625, -2.241943359375, -1.9471435546875, -1.65234375, -1.3575439453125, -1.062744140625, -0.7679443359375, -0.47314453125, -0.1783447265625, 0.116455078125, 0.4112548828125, 0.7060546875, 1.0008544921875, 1.295654296875, 1.5904541015625, 1.88525390625, 2.1800537109375, 2.474853515625, 2.7696533203125, 3.064453125, 3.3592529296875, 3.654052734375, 3.9488525390625, 4.24365234375, 4.5384521484375, 4.833251953125, 5.1280517578125, 5.4228515625, 5.7176513671875, 6.012451171875, 6.3072509765625, 6.60205078125, 6.8968505859375, 7.191650390625, 7.4864501953125, 7.78125]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 9.0, 13.0, 10.0, 14.0, 12.0, 25.0, 33.0, 32.0, 57.0, 64.0, 73.0, 134.0, 181.0, 224.0, 320.0, 443.0, 570.0, 811.0, 1209.0, 1734.0, 2636.0, 4021.0, 6601.0, 11650.0, 23663.0, 105516.0, 713560.0, 2444780.0, 706215.0, 110818.0, 27797.0, 11982.0, 6706.0, 4052.0, 2649.0, 1754.0, 1129.0, 821.0, 567.0, 398.0, 285.0, 234.0, 138.0, 94.0, 78.0, 60.0, 35.0, 28.0, 27.0, 9.0, 8.0, 6.0, 3.0, 1.0, 1.0], "bins": [-19.03125, -18.5098876953125, -17.988525390625, -17.4671630859375, -16.94580078125, -16.4244384765625, -15.903076171875, -15.3817138671875, -14.8603515625, -14.3389892578125, -13.817626953125, -13.2962646484375, -12.77490234375, -12.2535400390625, -11.732177734375, -11.2108154296875, -10.689453125, -10.1680908203125, -9.646728515625, -9.1253662109375, -8.60400390625, -8.0826416015625, -7.561279296875, -7.0399169921875, -6.5185546875, -5.9971923828125, -5.475830078125, -4.9544677734375, -4.43310546875, -3.9117431640625, -3.390380859375, -2.8690185546875, -2.34765625, -1.8262939453125, -1.304931640625, -0.7835693359375, -0.26220703125, 0.2591552734375, 0.780517578125, 1.3018798828125, 1.8232421875, 2.3446044921875, 2.865966796875, 3.3873291015625, 3.90869140625, 4.4300537109375, 4.951416015625, 5.4727783203125, 5.994140625, 6.5155029296875, 7.036865234375, 7.5582275390625, 8.07958984375, 8.6009521484375, 9.122314453125, 9.6436767578125, 10.1650390625, 10.6864013671875, 11.207763671875, 11.7291259765625, 12.25048828125, 12.7718505859375, 13.293212890625, 13.8145751953125, 14.3359375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 5.0, 10.0, 6.0, 8.0, 9.0, 10.0, 17.0, 20.0, 34.0, 45.0, 45.0, 83.0, 159.0, 280.0, 540.0, 933.0, 876.0, 426.0, 205.0, 122.0, 71.0, 46.0, 33.0, 12.0, 14.0, 23.0, 13.0, 6.0, 5.0, 6.0, 7.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-30.1875, -29.267578125, -28.34765625, -27.427734375, -26.5078125, -25.587890625, -24.66796875, -23.748046875, -22.828125, -21.908203125, -20.98828125, -20.068359375, -19.1484375, -18.228515625, -17.30859375, -16.388671875, -15.46875, -14.548828125, -13.62890625, -12.708984375, -11.7890625, -10.869140625, -9.94921875, -9.029296875, -8.109375, -7.189453125, -6.26953125, -5.349609375, -4.4296875, -3.509765625, -2.58984375, -1.669921875, -0.75, 0.169921875, 1.08984375, 2.009765625, 2.9296875, 3.849609375, 4.76953125, 5.689453125, 6.609375, 7.529296875, 8.44921875, 9.369140625, 10.2890625, 11.208984375, 12.12890625, 13.048828125, 13.96875, 14.888671875, 15.80859375, 16.728515625, 17.6484375, 18.568359375, 19.48828125, 20.408203125, 21.328125, 22.248046875, 23.16796875, 24.087890625, 25.0078125, 25.927734375, 26.84765625, 27.767578125, 28.6875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 9.0, 10.0, 12.0, 19.0, 51.0, 47.0, 87.0, 137.0, 303.0, 674.0, 1636.0, 4902.0, 18757.0, 129255.0, 3709487.0, 290481.0, 27887.0, 6676.0, 2196.0, 792.0, 374.0, 195.0, 106.0, 70.0, 34.0, 25.0, 19.0, 10.0, 9.0, 11.0, 0.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.34375, -53.59375, -51.84375, -50.09375, -48.34375, -46.59375, -44.84375, -43.09375, -41.34375, -39.59375, -37.84375, -36.09375, -34.34375, -32.59375, -30.84375, -29.09375, -27.34375, -25.59375, -23.84375, -22.09375, -20.34375, -18.59375, -16.84375, -15.09375, -13.34375, -11.59375, -9.84375, -8.09375, -6.34375, -4.59375, -2.84375, -1.09375, 0.65625, 2.40625, 4.15625, 5.90625, 7.65625, 9.40625, 11.15625, 12.90625, 14.65625, 16.40625, 18.15625, 19.90625, 21.65625, 23.40625, 25.15625, 26.90625, 28.65625, 30.40625, 32.15625, 33.90625, 35.65625, 37.40625, 39.15625, 40.90625, 42.65625, 44.40625, 46.15625, 47.90625, 49.65625, 51.40625, 53.15625, 54.90625, 56.65625]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 15.0, 27.0, 76.0, 109.0, 251.0, 253.0, 145.0, 53.0, 36.0, 20.0, 9.0, 8.0, 7.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-151.91897583007812, -145.04087829589844, -138.16278076171875, -131.28468322753906, -124.40658569335938, -117.52848815917969, -110.650390625, -103.77229309082031, -96.89419555664062, -90.01609802246094, -83.13800048828125, -76.25990295410156, -69.38180541992188, -62.50370407104492, -55.625606536865234, -48.74750900268555, -41.869407653808594, -34.991310119628906, -28.11321258544922, -21.2351131439209, -14.357015609741211, -7.478916168212891, -0.6008186340332031, 6.277278900146484, 13.155376434326172, 20.03347396850586, 26.911571502685547, 33.7896728515625, 40.66777038574219, 47.545867919921875, 54.42396545410156, 61.30206298828125, 68.18016052246094, 75.05825805664062, 81.93635559082031, 88.814453125, 95.69255065917969, 102.57064819335938, 109.44874572753906, 116.32684326171875, 123.20494079589844, 130.08303833007812, 136.9611358642578, 143.8392333984375, 150.7173309326172, 157.59542846679688, 164.47352600097656, 171.35162353515625, 178.229736328125, 185.1078338623047, 191.98593139648438, 198.86402893066406, 205.74212646484375, 212.62022399902344, 219.49832153320312, 226.3764190673828, 233.2545166015625, 240.1326141357422, 247.01071166992188, 253.88880920410156, 260.76690673828125, 267.64501953125, 274.5231018066406, 281.4012145996094, 288.279296875]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 7.0, 5.0, 12.0, 9.0, 10.0, 10.0, 20.0, 25.0, 9.0, 16.0, 26.0, 19.0, 25.0, 32.0, 40.0, 28.0, 41.0, 42.0, 36.0, 45.0, 40.0, 40.0, 36.0, 34.0, 39.0, 42.0, 33.0, 29.0, 27.0, 36.0, 20.0, 27.0, 23.0, 18.0, 18.0, 14.0, 8.0, 13.0, 11.0, 9.0, 8.0, 4.0, 6.0, 6.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-65.20747375488281, -63.1240234375, -61.04057312011719, -58.957122802734375, -56.8736686706543, -54.790218353271484, -52.70676803588867, -50.62331771850586, -48.53986358642578, -46.45641326904297, -44.372962951660156, -42.289512634277344, -40.206058502197266, -38.12260818481445, -36.03915786743164, -33.95570755004883, -31.872257232666016, -29.788806915283203, -27.705354690551758, -25.621904373168945, -23.5384521484375, -21.455001831054688, -19.371551513671875, -17.288101196289062, -15.204648971557617, -13.121197700500488, -11.03774642944336, -8.954296112060547, -6.870844841003418, -4.787393569946289, -2.7039432525634766, -0.6204919815063477, 1.4629592895507812, 3.546410322189331, 5.629861354827881, 7.713312149047852, 9.79676342010498, 11.88021469116211, 13.963665008544922, 16.047115325927734, 18.13056755065918, 20.214017868041992, 22.297470092773438, 24.38092041015625, 26.464370727539062, 28.547822952270508, 30.63127326965332, 32.714725494384766, 34.79817581176758, 36.88162612915039, 38.9650764465332, 41.04853057861328, 43.131980895996094, 45.215431213378906, 47.29888153076172, 49.38233184814453, 51.465782165527344, 53.549232482910156, 55.63268280029297, 57.71613311767578, 59.79958724975586, 61.88303756713867, 63.966487884521484, 66.04994201660156, 68.13339233398438]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 3.0, 5.0, 7.0, 5.0, 7.0, 5.0, 16.0, 14.0, 13.0, 14.0, 13.0, 21.0, 18.0, 25.0, 37.0, 26.0, 24.0, 41.0, 32.0, 31.0, 42.0, 47.0, 45.0, 49.0, 51.0, 42.0, 43.0, 37.0, 27.0, 35.0, 34.0, 25.0, 26.0, 17.0, 18.0, 21.0, 17.0, 14.0, 17.0, 9.0, 6.0, 5.0, 2.0, 9.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0], "bins": [-10.375, -10.085205078125, -9.79541015625, -9.505615234375, -9.2158203125, -8.926025390625, -8.63623046875, -8.346435546875, -8.056640625, -7.766845703125, -7.47705078125, -7.187255859375, -6.8974609375, -6.607666015625, -6.31787109375, -6.028076171875, -5.73828125, -5.448486328125, -5.15869140625, -4.868896484375, -4.5791015625, -4.289306640625, -3.99951171875, -3.709716796875, -3.419921875, -3.130126953125, -2.84033203125, -2.550537109375, -2.2607421875, -1.970947265625, -1.68115234375, -1.391357421875, -1.1015625, -0.811767578125, -0.52197265625, -0.232177734375, 0.0576171875, 0.347412109375, 0.63720703125, 0.927001953125, 1.216796875, 1.506591796875, 1.79638671875, 2.086181640625, 2.3759765625, 2.665771484375, 2.95556640625, 3.245361328125, 3.53515625, 3.824951171875, 4.11474609375, 4.404541015625, 4.6943359375, 4.984130859375, 5.27392578125, 5.563720703125, 5.853515625, 6.143310546875, 6.43310546875, 6.722900390625, 7.0126953125, 7.302490234375, 7.59228515625, 7.882080078125, 8.171875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 6.0, 4.0, 10.0, 14.0, 20.0, 25.0, 42.0, 72.0, 88.0, 129.0, 188.0, 327.0, 497.0, 747.0, 1119.0, 1762.0, 2568.0, 3867.0, 5786.0, 9041.0, 13290.0, 19871.0, 29675.0, 45765.0, 71796.0, 114046.0, 182441.0, 197268.0, 123555.0, 78405.0, 50117.0, 32502.0, 21442.0, 14371.0, 9249.0, 6104.0, 4169.0, 2805.0, 1818.0, 1197.0, 772.0, 532.0, 345.0, 228.0, 160.0, 110.0, 60.0, 50.0, 22.0, 31.0, 24.0, 8.0, 11.0, 4.0, 10.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.1983642578125, -0.1919841766357422, -0.18560409545898438, -0.17922401428222656, -0.17284393310546875, -0.16646385192871094, -0.16008377075195312, -0.1537036895751953, -0.1473236083984375, -0.1409435272216797, -0.13456344604492188, -0.12818336486816406, -0.12180328369140625, -0.11542320251464844, -0.10904312133789062, -0.10266304016113281, -0.096282958984375, -0.08990287780761719, -0.08352279663085938, -0.07714271545410156, -0.07076263427734375, -0.06438255310058594, -0.058002471923828125, -0.05162239074707031, -0.0452423095703125, -0.03886222839355469, -0.032482147216796875, -0.026102066040039062, -0.01972198486328125, -0.013341903686523438, -0.006961822509765625, -0.0005817413330078125, 0.00579833984375, 0.012178421020507812, 0.018558502197265625, 0.024938583374023438, 0.03131866455078125, 0.03769874572753906, 0.044078826904296875, 0.05045890808105469, 0.0568389892578125, 0.06321907043457031, 0.06959915161132812, 0.07597923278808594, 0.08235931396484375, 0.08873939514160156, 0.09511947631835938, 0.10149955749511719, 0.107879638671875, 0.11425971984863281, 0.12063980102539062, 0.12701988220214844, 0.13339996337890625, 0.13978004455566406, 0.14616012573242188, 0.1525402069091797, 0.1589202880859375, 0.1653003692626953, 0.17168045043945312, 0.17806053161621094, 0.18444061279296875, 0.19082069396972656, 0.19720077514648438, 0.2035808563232422, 0.2099609375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 1.0, 2.0, 7.0, 6.0, 10.0, 7.0, 7.0, 17.0, 12.0, 11.0, 22.0, 24.0, 22.0, 29.0, 27.0, 25.0, 28.0, 26.0, 36.0, 45.0, 32.0, 45.0, 45.0, 1062.0, 40.0, 26.0, 34.0, 38.0, 33.0, 25.0, 33.0, 31.0, 21.0, 26.0, 32.0, 22.0, 21.0, 12.0, 12.0, 14.0, 16.0, 5.0, 15.0, 2.0, 5.0, 6.0, 4.0, 3.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.625, -6.41632080078125, -6.2076416015625, -5.99896240234375, -5.790283203125, -5.58160400390625, -5.3729248046875, -5.16424560546875, -4.95556640625, -4.74688720703125, -4.5382080078125, -4.32952880859375, -4.120849609375, -3.91217041015625, -3.7034912109375, -3.49481201171875, -3.2861328125, -3.07745361328125, -2.8687744140625, -2.66009521484375, -2.451416015625, -2.24273681640625, -2.0340576171875, -1.82537841796875, -1.61669921875, -1.40802001953125, -1.1993408203125, -0.99066162109375, -0.781982421875, -0.57330322265625, -0.3646240234375, -0.15594482421875, 0.052734375, 0.26141357421875, 0.4700927734375, 0.67877197265625, 0.887451171875, 1.09613037109375, 1.3048095703125, 1.51348876953125, 1.72216796875, 1.93084716796875, 2.1395263671875, 2.34820556640625, 2.556884765625, 2.76556396484375, 2.9742431640625, 3.18292236328125, 3.3916015625, 3.60028076171875, 3.8089599609375, 4.01763916015625, 4.226318359375, 4.43499755859375, 4.6436767578125, 4.85235595703125, 5.06103515625, 5.26971435546875, 5.4783935546875, 5.68707275390625, 5.895751953125, 6.10443115234375, 6.3131103515625, 6.52178955078125, 6.73046875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 3.0, 8.0, 8.0, 13.0, 12.0, 23.0, 35.0, 37.0, 63.0, 95.0, 117.0, 174.0, 255.0, 344.0, 534.0, 687.0, 1041.0, 1453.0, 2057.0, 2982.0, 4537.0, 6308.0, 9226.0, 13232.0, 19364.0, 28493.0, 41017.0, 59968.0, 88889.0, 133187.0, 1227620.0, 146327.0, 98426.0, 66002.0, 44808.0, 31213.0, 21449.0, 14731.0, 9805.0, 6926.0, 4777.0, 3335.0, 2264.0, 1522.0, 1153.0, 769.0, 534.0, 372.0, 253.0, 214.0, 146.0, 82.0, 90.0, 55.0, 33.0, 29.0, 14.0, 13.0, 9.0, 4.0, 6.0, 3.0, 3.0], "bins": [-0.08935546875, -0.08652973175048828, -0.08370399475097656, -0.08087825775146484, -0.07805252075195312, -0.0752267837524414, -0.07240104675292969, -0.06957530975341797, -0.06674957275390625, -0.06392383575439453, -0.06109809875488281, -0.058272361755371094, -0.055446624755859375, -0.052620887756347656, -0.04979515075683594, -0.04696941375732422, -0.0441436767578125, -0.04131793975830078, -0.03849220275878906, -0.035666465759277344, -0.032840728759765625, -0.030014991760253906, -0.027189254760742188, -0.02436351776123047, -0.02153778076171875, -0.01871204376220703, -0.015886306762695312, -0.013060569763183594, -0.010234832763671875, -0.007409095764160156, -0.0045833587646484375, -0.0017576217651367188, 0.001068115234375, 0.0038938522338867188, 0.0067195892333984375, 0.009545326232910156, 0.012371063232421875, 0.015196800231933594, 0.018022537231445312, 0.02084827423095703, 0.02367401123046875, 0.02649974822998047, 0.029325485229492188, 0.032151222229003906, 0.034976959228515625, 0.037802696228027344, 0.04062843322753906, 0.04345417022705078, 0.0462799072265625, 0.04910564422607422, 0.05193138122558594, 0.054757118225097656, 0.057582855224609375, 0.060408592224121094, 0.06323432922363281, 0.06606006622314453, 0.06888580322265625, 0.07171154022216797, 0.07453727722167969, 0.0773630142211914, 0.08018875122070312, 0.08301448822021484, 0.08584022521972656, 0.08866596221923828, 0.09149169921875]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 7.0, 6.0, 9.0, 8.0, 13.0, 10.0, 16.0, 15.0, 18.0, 29.0, 35.0, 31.0, 40.0, 52.0, 44.0, 55.0, 49.0, 56.0, 55.0, 39.0, 40.0, 43.0, 43.0, 42.0, 42.0, 36.0, 21.0, 30.0, 19.0, 14.0, 17.0, 9.0, 8.0, 12.0, 7.0, 2.0, 8.0, 2.0, 4.0, 4.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.0010166168212890625, -0.0009859949350357056, -0.0009553730487823486, -0.0009247511625289917, -0.0008941292762756348, -0.0008635073900222778, -0.0008328855037689209, -0.000802263617515564, -0.000771641731262207, -0.0007410198450088501, -0.0007103979587554932, -0.0006797760725021362, -0.0006491541862487793, -0.0006185322999954224, -0.0005879104137420654, -0.0005572885274887085, -0.0005266666412353516, -0.0004960447549819946, -0.0004654228687286377, -0.00043480098247528076, -0.00040417909622192383, -0.0003735572099685669, -0.00034293532371520996, -0.00031231343746185303, -0.0002816915512084961, -0.00025106966495513916, -0.00022044777870178223, -0.0001898258924484253, -0.00015920400619506836, -0.00012858211994171143, -9.796023368835449e-05, -6.733834743499756e-05, -3.6716461181640625e-05, -6.094574928283691e-06, 2.4527311325073242e-05, 5.5149197578430176e-05, 8.577108383178711e-05, 0.00011639297008514404, 0.00014701485633850098, 0.0001776367425918579, 0.00020825862884521484, 0.00023888051509857178, 0.0002695024013519287, 0.00030012428760528564, 0.0003307461738586426, 0.0003613680601119995, 0.00039198994636535645, 0.0004226118326187134, 0.0004532337188720703, 0.00048385560512542725, 0.0005144774913787842, 0.0005450993776321411, 0.000575721263885498, 0.000606343150138855, 0.0006369650363922119, 0.0006675869226455688, 0.0006982088088989258, 0.0007288306951522827, 0.0007594525814056396, 0.0007900744676589966, 0.0008206963539123535, 0.0008513182401657104, 0.0008819401264190674, 0.0009125620126724243, 0.0009431838989257812]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 5.0, 3.0, 2.0, 7.0, 5.0, 7.0, 9.0, 14.0, 13.0, 14.0, 18.0, 22.0, 28.0, 35.0, 75.0, 103.0, 158.0, 244.0, 480.0, 1127.0, 28473.0, 1008390.0, 7349.0, 879.0, 402.0, 216.0, 134.0, 83.0, 58.0, 50.0, 32.0, 25.0, 22.0, 12.0, 9.0, 11.0, 10.0, 7.0, 5.0, 10.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0184173583984375, -0.017810821533203125, -0.01720428466796875, -0.016597747802734375, -0.0159912109375, -0.015384674072265625, -0.01477813720703125, -0.014171600341796875, -0.0135650634765625, -0.012958526611328125, -0.01235198974609375, -0.011745452880859375, -0.011138916015625, -0.010532379150390625, -0.00992584228515625, -0.009319305419921875, -0.0087127685546875, -0.008106231689453125, -0.00749969482421875, -0.006893157958984375, -0.00628662109375, -0.005680084228515625, -0.00507354736328125, -0.004467010498046875, -0.0038604736328125, -0.003253936767578125, -0.00264739990234375, -0.002040863037109375, -0.001434326171875, -0.000827789306640625, -0.00022125244140625, 0.000385284423828125, 0.0009918212890625, 0.001598358154296875, 0.00220489501953125, 0.002811431884765625, 0.00341796875, 0.004024505615234375, 0.00463104248046875, 0.005237579345703125, 0.0058441162109375, 0.006450653076171875, 0.00705718994140625, 0.007663726806640625, 0.008270263671875, 0.008876800537109375, 0.00948333740234375, 0.010089874267578125, 0.0106964111328125, 0.011302947998046875, 0.01190948486328125, 0.012516021728515625, 0.01312255859375, 0.013729095458984375, 0.01433563232421875, 0.014942169189453125, 0.0155487060546875, 0.016155242919921875, 0.01676177978515625, 0.017368316650390625, 0.017974853515625, 0.018581390380859375, 0.01918792724609375, 0.019794464111328125, 0.0204010009765625]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 353.0, 658.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03300518915057182, -0.032426510006189346, -0.03184782713651657, -0.031269147992134094, -0.03069046512246132, -0.030111784115433693, -0.029533103108406067, -0.02895442396402359, -0.028375741094350815, -0.02779706008732319, -0.027218379080295563, -0.026639698073267937, -0.02606101706624031, -0.025482336059212685, -0.02490365505218506, -0.024324975907802582, -0.023746294900774956, -0.02316761389374733, -0.022588932886719704, -0.022010251879692078, -0.02143157087266445, -0.020852889865636826, -0.0202742088586092, -0.019695527851581573, -0.019116848707199097, -0.01853816770017147, -0.017959486693143845, -0.01738080568611622, -0.016802124679088593, -0.016223443672060966, -0.01564476266503334, -0.015066082589328289, -0.014487400650978088, -0.013908719643950462, -0.013330038636922836, -0.01275135762989521, -0.012172676622867584, -0.011593995615839958, -0.011015315540134907, -0.01043663453310728, -0.009857953526079655, -0.009279272519052029, -0.008700591512024403, -0.008121910504996777, -0.007543229963630438, -0.006964548956602812, -0.006385868415236473, -0.005807187408208847, -0.005228506401181221, -0.004649825394153595, -0.004071144387125969, -0.00349246384575963, -0.002913782838732004, -0.002335101831704378, -0.0017564210575073957, -0.0011777402833104134, -0.0005990592762827873, -2.0378385670483112e-05, 0.0005583025049418211, 0.0011369833955541253, 0.0017156642861664295, 0.0022943452931940556, 0.002873026067391038, 0.0034517068415880203, 0.004030387848615646]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 5.0, 9.0, 12.0, 19.0, 19.0, 25.0, 21.0, 25.0, 35.0, 29.0, 41.0, 61.0, 56.0, 63.0, 64.0, 75.0, 64.0, 49.0, 62.0, 55.0, 37.0, 25.0, 27.0, 34.0, 18.0, 20.0, 16.0, 11.0, 4.0, 3.0, 4.0, 6.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001224815845489502, -0.0011795097962021828, -0.0011342037469148636, -0.0010888976976275444, -0.0010435916483402252, -0.000998285599052906, -0.0009529795497655869, -0.0009076735004782677, -0.0008623674511909485, -0.0008170614019036293, -0.0007717553526163101, -0.0007264493033289909, -0.0006811432540416718, -0.0006358372047543526, -0.0005905311554670334, -0.0005452251061797142, -0.000499919056892395, -0.00045461300760507584, -0.00040930695831775665, -0.00036400090903043747, -0.0003186948597431183, -0.0002733888104557991, -0.00022808276116847992, -0.00018277671188116074, -0.00013747066259384155, -9.216461330652237e-05, -4.6858564019203186e-05, -1.5525147318840027e-06, 4.375353455543518e-05, 8.905958384275436e-05, 0.00013436563313007355, 0.00017967168241739273, 0.00022497773170471191, 0.0002702837809920311, 0.0003155898302793503, 0.00036089587956666946, 0.00040620192885398865, 0.00045150797814130783, 0.000496814027428627, 0.0005421200767159462, 0.0005874261260032654, 0.0006327321752905846, 0.0006780382245779037, 0.0007233442738652229, 0.0007686503231525421, 0.0008139563724398613, 0.0008592624217271805, 0.0009045684710144997, 0.0009498745203018188, 0.000995180569589138, 0.0010404866188764572, 0.0010857926681637764, 0.0011310987174510956, 0.0011764047667384148, 0.001221710816025734, 0.0012670168653130531, 0.0013123229146003723, 0.0013576289638876915, 0.0014029350131750107, 0.0014482410624623299, 0.001493547111749649, 0.0015388531610369682, 0.0015841592103242874, 0.0016294652596116066, 0.0016747713088989258]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 3.0, 5.0, 7.0, 5.0, 7.0, 5.0, 16.0, 14.0, 13.0, 14.0, 13.0, 21.0, 18.0, 25.0, 37.0, 26.0, 24.0, 41.0, 32.0, 31.0, 42.0, 47.0, 45.0, 49.0, 51.0, 42.0, 43.0, 37.0, 27.0, 35.0, 34.0, 25.0, 26.0, 17.0, 18.0, 21.0, 17.0, 14.0, 17.0, 9.0, 6.0, 5.0, 2.0, 9.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0], "bins": [-10.375, -10.085205078125, -9.79541015625, -9.505615234375, -9.2158203125, -8.926025390625, -8.63623046875, -8.346435546875, -8.056640625, -7.766845703125, -7.47705078125, -7.187255859375, -6.8974609375, -6.607666015625, -6.31787109375, -6.028076171875, -5.73828125, -5.448486328125, -5.15869140625, -4.868896484375, -4.5791015625, -4.289306640625, -3.99951171875, -3.709716796875, -3.419921875, -3.130126953125, -2.84033203125, -2.550537109375, -2.2607421875, -1.970947265625, -1.68115234375, -1.391357421875, -1.1015625, -0.811767578125, -0.52197265625, -0.232177734375, 0.0576171875, 0.347412109375, 0.63720703125, 0.927001953125, 1.216796875, 1.506591796875, 1.79638671875, 2.086181640625, 2.3759765625, 2.665771484375, 2.95556640625, 3.245361328125, 3.53515625, 3.824951171875, 4.11474609375, 4.404541015625, 4.6943359375, 4.984130859375, 5.27392578125, 5.563720703125, 5.853515625, 6.143310546875, 6.43310546875, 6.722900390625, 7.0126953125, 7.302490234375, 7.59228515625, 7.882080078125, 8.171875]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 8.0, 11.0, 11.0, 9.0, 22.0, 26.0, 38.0, 46.0, 56.0, 117.0, 130.0, 179.0, 292.0, 352.0, 610.0, 869.0, 1427.0, 2291.0, 3905.0, 7545.0, 16775.0, 48818.0, 246793.0, 578209.0, 90315.0, 25894.0, 10732.0, 5056.0, 2949.0, 1746.0, 1094.0, 707.0, 445.0, 322.0, 222.0, 151.0, 124.0, 72.0, 55.0, 28.0, 38.0, 16.0, 11.0, 11.0, 12.0, 4.0, 6.0, 1.0, 3.0, 1.0, 1.0, 3.0], "bins": [-18.65625, -18.1265869140625, -17.596923828125, -17.0672607421875, -16.53759765625, -16.0079345703125, -15.478271484375, -14.9486083984375, -14.4189453125, -13.8892822265625, -13.359619140625, -12.8299560546875, -12.30029296875, -11.7706298828125, -11.240966796875, -10.7113037109375, -10.181640625, -9.6519775390625, -9.122314453125, -8.5926513671875, -8.06298828125, -7.5333251953125, -7.003662109375, -6.4739990234375, -5.9443359375, -5.4146728515625, -4.885009765625, -4.3553466796875, -3.82568359375, -3.2960205078125, -2.766357421875, -2.2366943359375, -1.70703125, -1.1773681640625, -0.647705078125, -0.1180419921875, 0.41162109375, 0.9412841796875, 1.470947265625, 2.0006103515625, 2.5302734375, 3.0599365234375, 3.589599609375, 4.1192626953125, 4.64892578125, 5.1785888671875, 5.708251953125, 6.2379150390625, 6.767578125, 7.2972412109375, 7.826904296875, 8.3565673828125, 8.88623046875, 9.4158935546875, 9.945556640625, 10.4752197265625, 11.0048828125, 11.5345458984375, 12.064208984375, 12.5938720703125, 13.12353515625, 13.6531982421875, 14.182861328125, 14.7125244140625, 15.2421875]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 8.0, 2.0, 4.0, 7.0, 10.0, 10.0, 12.0, 20.0, 15.0, 25.0, 33.0, 33.0, 38.0, 44.0, 54.0, 86.0, 106.0, 231.0, 1662.0, 180.0, 93.0, 72.0, 42.0, 55.0, 32.0, 36.0, 29.0, 22.0, 16.0, 19.0, 11.0, 15.0, 8.0, 4.0, 6.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.625, -36.29736328125, -34.9697265625, -33.64208984375, -32.314453125, -30.98681640625, -29.6591796875, -28.33154296875, -27.00390625, -25.67626953125, -24.3486328125, -23.02099609375, -21.693359375, -20.36572265625, -19.0380859375, -17.71044921875, -16.3828125, -15.05517578125, -13.7275390625, -12.39990234375, -11.072265625, -9.74462890625, -8.4169921875, -7.08935546875, -5.76171875, -4.43408203125, -3.1064453125, -1.77880859375, -0.451171875, 0.87646484375, 2.2041015625, 3.53173828125, 4.859375, 6.18701171875, 7.5146484375, 8.84228515625, 10.169921875, 11.49755859375, 12.8251953125, 14.15283203125, 15.48046875, 16.80810546875, 18.1357421875, 19.46337890625, 20.791015625, 22.11865234375, 23.4462890625, 24.77392578125, 26.1015625, 27.42919921875, 28.7568359375, 30.08447265625, 31.412109375, 32.73974609375, 34.0673828125, 35.39501953125, 36.72265625, 38.05029296875, 39.3779296875, 40.70556640625, 42.033203125, 43.36083984375, 44.6884765625, 46.01611328125, 47.34375]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 3.0, 3.0, 2.0, 4.0, 7.0, 6.0, 11.0, 15.0, 19.0, 27.0, 33.0, 52.0, 66.0, 73.0, 112.0, 198.0, 388.0, 1237.0, 9768.0, 761521.0, 2356929.0, 12689.0, 1465.0, 416.0, 170.0, 124.0, 96.0, 71.0, 39.0, 44.0, 34.0, 24.0, 17.0, 12.0, 7.0, 4.0, 6.0, 11.0, 6.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-84.8125, -82.4599609375, -80.107421875, -77.7548828125, -75.40234375, -73.0498046875, -70.697265625, -68.3447265625, -65.9921875, -63.6396484375, -61.287109375, -58.9345703125, -56.58203125, -54.2294921875, -51.876953125, -49.5244140625, -47.171875, -44.8193359375, -42.466796875, -40.1142578125, -37.76171875, -35.4091796875, -33.056640625, -30.7041015625, -28.3515625, -25.9990234375, -23.646484375, -21.2939453125, -18.94140625, -16.5888671875, -14.236328125, -11.8837890625, -9.53125, -7.1787109375, -4.826171875, -2.4736328125, -0.12109375, 2.2314453125, 4.583984375, 6.9365234375, 9.2890625, 11.6416015625, 13.994140625, 16.3466796875, 18.69921875, 21.0517578125, 23.404296875, 25.7568359375, 28.109375, 30.4619140625, 32.814453125, 35.1669921875, 37.51953125, 39.8720703125, 42.224609375, 44.5771484375, 46.9296875, 49.2822265625, 51.634765625, 53.9873046875, 56.33984375, 58.6923828125, 61.044921875, 63.3974609375, 65.75]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 266.0, 751.0], "bins": [-1739.109375, -1711.553466796875, -1683.9976806640625, -1656.4417724609375, -1628.8858642578125, -1601.3299560546875, -1573.774169921875, -1546.21826171875, -1518.662353515625, -1491.1064453125, -1463.5506591796875, -1435.9947509765625, -1408.4388427734375, -1380.8829345703125, -1353.3271484375, -1325.771240234375, -1298.21533203125, -1270.659423828125, -1243.1036376953125, -1215.5477294921875, -1187.9918212890625, -1160.4359130859375, -1132.880126953125, -1105.32421875, -1077.7684326171875, -1050.2125244140625, -1022.6566772460938, -995.100830078125, -967.544921875, -939.9890747070312, -912.4332275390625, -884.8773193359375, -857.3213500976562, -829.7655029296875, -802.2095947265625, -774.6537475585938, -747.0978393554688, -719.5419921875, -691.986083984375, -664.4302368164062, -636.8743896484375, -609.3185424804688, -581.7626342773438, -554.206787109375, -526.65087890625, -499.09503173828125, -471.5391540527344, -443.9832763671875, -416.4273986816406, -388.87152099609375, -361.3156433105469, -333.759765625, -306.20391845703125, -278.64801025390625, -251.0921630859375, -223.53628540039062, -195.9803924560547, -168.4245147705078, -140.86865234375, -113.31277465820312, -85.75689697265625, -58.201019287109375, -30.645156860351562, -3.0892791748046875, 24.466596603393555]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 4.0, 6.0, 3.0, 11.0, 7.0, 7.0, 12.0, 10.0, 10.0, 10.0, 22.0, 16.0, 32.0, 28.0, 36.0, 34.0, 44.0, 38.0, 36.0, 48.0, 30.0, 39.0, 49.0, 37.0, 42.0, 38.0, 37.0, 40.0, 36.0, 36.0, 25.0, 37.0, 19.0, 21.0, 17.0, 16.0, 12.0, 12.0, 10.0, 10.0, 15.0, 3.0, 4.0, 1.0, 1.0, 1.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-83.80767822265625, -81.05241394042969, -78.29714965820312, -75.5418930053711, -72.78662872314453, -70.03136444091797, -67.27610778808594, -64.52084350585938, -61.76557922363281, -59.01031494140625, -56.25505447387695, -53.499794006347656, -50.744529724121094, -47.98926544189453, -45.234004974365234, -42.47874450683594, -39.723480224609375, -36.96821594238281, -34.212955474853516, -31.457693099975586, -28.702430725097656, -25.947168350219727, -23.191905975341797, -20.436643600463867, -17.681381225585938, -14.926118850708008, -12.170856475830078, -9.415594100952148, -6.660331726074219, -3.905069351196289, -1.1498069763183594, 1.6054553985595703, 4.3607177734375, 7.11598014831543, 9.87124252319336, 12.626504898071289, 15.381767272949219, 18.13702964782715, 20.892292022705078, 23.647554397583008, 26.402816772460938, 29.158079147338867, 31.913341522216797, 34.668601989746094, 37.423866271972656, 40.17913055419922, 42.934391021728516, 45.68965148925781, 48.444915771484375, 51.20018005371094, 53.955440521240234, 56.71070098876953, 59.465965270996094, 62.221229553222656, 64.97648620605469, 67.73175048828125, 70.48701477050781, 73.24227905273438, 75.99754333496094, 78.75279998779297, 81.50806427001953, 84.2633285522461, 87.01858520507812, 89.77384948730469, 92.52911376953125]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 5.0, 10.0, 2.0, 3.0, 6.0, 11.0, 11.0, 9.0, 16.0, 16.0, 20.0, 17.0, 20.0, 32.0, 23.0, 32.0, 29.0, 40.0, 31.0, 42.0, 50.0, 53.0, 41.0, 42.0, 46.0, 46.0, 49.0, 42.0, 31.0, 28.0, 30.0, 27.0, 17.0, 17.0, 20.0, 16.0, 15.0, 19.0, 11.0, 6.0, 8.0, 4.0, 6.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.8046875, -11.4803466796875, -11.156005859375, -10.8316650390625, -10.50732421875, -10.1829833984375, -9.858642578125, -9.5343017578125, -9.2099609375, -8.8856201171875, -8.561279296875, -8.2369384765625, -7.91259765625, -7.5882568359375, -7.263916015625, -6.9395751953125, -6.615234375, -6.2908935546875, -5.966552734375, -5.6422119140625, -5.31787109375, -4.9935302734375, -4.669189453125, -4.3448486328125, -4.0205078125, -3.6961669921875, -3.371826171875, -3.0474853515625, -2.72314453125, -2.3988037109375, -2.074462890625, -1.7501220703125, -1.42578125, -1.1014404296875, -0.777099609375, -0.4527587890625, -0.12841796875, 0.1959228515625, 0.520263671875, 0.8446044921875, 1.1689453125, 1.4932861328125, 1.817626953125, 2.1419677734375, 2.46630859375, 2.7906494140625, 3.114990234375, 3.4393310546875, 3.763671875, 4.0880126953125, 4.412353515625, 4.7366943359375, 5.06103515625, 5.3853759765625, 5.709716796875, 6.0340576171875, 6.3583984375, 6.6827392578125, 7.007080078125, 7.3314208984375, 7.65576171875, 7.9801025390625, 8.304443359375, 8.6287841796875, 8.953125]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 4.0, 8.0, 7.0, 7.0, 5.0, 12.0, 10.0, 21.0, 24.0, 27.0, 33.0, 46.0, 66.0, 96.0, 192.0, 257.0, 472.0, 994.0, 2276.0, 5838.0, 18281.0, 221331.0, 3653669.0, 261517.0, 19055.0, 5786.0, 2169.0, 935.0, 429.0, 262.0, 119.0, 85.0, 62.0, 47.0, 28.0, 30.0, 17.0, 26.0, 15.0, 8.0, 3.0, 6.0, 6.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.40625, -46.10791015625, -44.8095703125, -43.51123046875, -42.212890625, -40.91455078125, -39.6162109375, -38.31787109375, -37.01953125, -35.72119140625, -34.4228515625, -33.12451171875, -31.826171875, -30.52783203125, -29.2294921875, -27.93115234375, -26.6328125, -25.33447265625, -24.0361328125, -22.73779296875, -21.439453125, -20.14111328125, -18.8427734375, -17.54443359375, -16.24609375, -14.94775390625, -13.6494140625, -12.35107421875, -11.052734375, -9.75439453125, -8.4560546875, -7.15771484375, -5.859375, -4.56103515625, -3.2626953125, -1.96435546875, -0.666015625, 0.63232421875, 1.9306640625, 3.22900390625, 4.52734375, 5.82568359375, 7.1240234375, 8.42236328125, 9.720703125, 11.01904296875, 12.3173828125, 13.61572265625, 14.9140625, 16.21240234375, 17.5107421875, 18.80908203125, 20.107421875, 21.40576171875, 22.7041015625, 24.00244140625, 25.30078125, 26.59912109375, 27.8974609375, 29.19580078125, 30.494140625, 31.79248046875, 33.0908203125, 34.38916015625, 35.6875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 2.0, 3.0, 6.0, 11.0, 6.0, 16.0, 11.0, 18.0, 22.0, 30.0, 37.0, 56.0, 95.0, 166.0, 329.0, 648.0, 833.0, 773.0, 420.0, 222.0, 125.0, 61.0, 41.0, 36.0, 20.0, 19.0, 21.0, 19.0, 8.0, 7.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.09375, -33.166015625, -32.23828125, -31.310546875, -30.3828125, -29.455078125, -28.52734375, -27.599609375, -26.671875, -25.744140625, -24.81640625, -23.888671875, -22.9609375, -22.033203125, -21.10546875, -20.177734375, -19.25, -18.322265625, -17.39453125, -16.466796875, -15.5390625, -14.611328125, -13.68359375, -12.755859375, -11.828125, -10.900390625, -9.97265625, -9.044921875, -8.1171875, -7.189453125, -6.26171875, -5.333984375, -4.40625, -3.478515625, -2.55078125, -1.623046875, -0.6953125, 0.232421875, 1.16015625, 2.087890625, 3.015625, 3.943359375, 4.87109375, 5.798828125, 6.7265625, 7.654296875, 8.58203125, 9.509765625, 10.4375, 11.365234375, 12.29296875, 13.220703125, 14.1484375, 15.076171875, 16.00390625, 16.931640625, 17.859375, 18.787109375, 19.71484375, 20.642578125, 21.5703125, 22.498046875, 23.42578125, 24.353515625, 25.28125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 5.0, 12.0, 18.0, 31.0, 28.0, 48.0, 96.0, 175.0, 447.0, 1269.0, 4109.0, 18060.0, 158441.0, 3820213.0, 166582.0, 18326.0, 4249.0, 1276.0, 438.0, 178.0, 105.0, 51.0, 22.0, 19.0, 20.0, 19.0, 7.0, 11.0, 3.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.59375, -53.57275390625, -51.5517578125, -49.53076171875, -47.509765625, -45.48876953125, -43.4677734375, -41.44677734375, -39.42578125, -37.40478515625, -35.3837890625, -33.36279296875, -31.341796875, -29.32080078125, -27.2998046875, -25.27880859375, -23.2578125, -21.23681640625, -19.2158203125, -17.19482421875, -15.173828125, -13.15283203125, -11.1318359375, -9.11083984375, -7.08984375, -5.06884765625, -3.0478515625, -1.02685546875, 0.994140625, 3.01513671875, 5.0361328125, 7.05712890625, 9.078125, 11.09912109375, 13.1201171875, 15.14111328125, 17.162109375, 19.18310546875, 21.2041015625, 23.22509765625, 25.24609375, 27.26708984375, 29.2880859375, 31.30908203125, 33.330078125, 35.35107421875, 37.3720703125, 39.39306640625, 41.4140625, 43.43505859375, 45.4560546875, 47.47705078125, 49.498046875, 51.51904296875, 53.5400390625, 55.56103515625, 57.58203125, 59.60302734375, 61.6240234375, 63.64501953125, 65.666015625, 67.68701171875, 69.7080078125, 71.72900390625, 73.75]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 2.0, 6.0, 7.0, 8.0, 12.0, 30.0, 25.0, 35.0, 64.0, 82.0, 110.0, 143.0, 130.0, 110.0, 88.0, 49.0, 40.0, 22.0, 22.0, 12.0, 4.0, 2.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.06134033203125, -50.48974609375, -46.91815185546875, -43.346561431884766, -39.774967193603516, -36.203372955322266, -32.63178253173828, -29.06018829345703, -25.48859405517578, -21.91699981689453, -18.345407485961914, -14.77381420135498, -11.202220916748047, -7.630626678466797, -4.05903434753418, -0.4874420166015625, 3.0841522216796875, 6.655745506286621, 10.227338790893555, 13.798932075500488, 17.370525360107422, 20.942119598388672, 24.51371192932129, 28.085304260253906, 31.656898498535156, 35.228492736816406, 38.800086975097656, 42.37167739868164, 45.94327163696289, 49.51486587524414, 53.086456298828125, 56.658050537109375, 60.229644775390625, 63.801239013671875, 67.37283325195312, 70.94442749023438, 74.51602172851562, 78.08761596679688, 81.6592025756836, 85.23079681396484, 88.8023910522461, 92.37398529052734, 95.9455795288086, 99.51717376708984, 103.08876037597656, 106.66035461425781, 110.23194885253906, 113.80354309082031, 117.37513732910156, 120.94673156738281, 124.51832580566406, 128.0899200439453, 131.66151428222656, 135.2331085205078, 138.80470275878906, 142.37628173828125, 145.9478759765625, 149.51947021484375, 153.091064453125, 156.66265869140625, 160.2342529296875, 163.80584716796875, 167.37744140625, 170.94903564453125, 174.5206298828125]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 5.0, 4.0, 3.0, 5.0, 9.0, 12.0, 17.0, 18.0, 20.0, 13.0, 20.0, 16.0, 26.0, 24.0, 23.0, 22.0, 31.0, 40.0, 40.0, 34.0, 36.0, 35.0, 41.0, 36.0, 41.0, 40.0, 34.0, 50.0, 34.0, 34.0, 34.0, 29.0, 18.0, 14.0, 24.0, 19.0, 9.0, 19.0, 18.0, 9.0, 7.0, 5.0, 6.0, 4.0, 6.0, 5.0, 4.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-70.21063995361328, -68.07457733154297, -65.93851470947266, -63.802452087402344, -61.6663932800293, -59.530330657958984, -57.39426803588867, -55.25820541381836, -53.12214660644531, -50.986083984375, -48.85002136230469, -46.713958740234375, -44.57789993286133, -42.441837310791016, -40.3057746887207, -38.16971206665039, -36.03364944458008, -33.897586822509766, -31.761526107788086, -29.625463485717773, -27.489402770996094, -25.35334014892578, -23.21727752685547, -21.081214904785156, -18.945154190063477, -16.809091567993164, -14.673030853271484, -12.536968231201172, -10.400906562805176, -8.26484489440918, -6.128782272338867, -3.992720603942871, -1.856658935546875, 0.2794029712677002, 2.4154648780822754, 4.55152702331543, 6.687588691711426, 8.823650360107422, 10.959712982177734, 13.09577465057373, 15.231836318969727, 17.36789894104004, 19.50395965576172, 21.64002227783203, 23.776084899902344, 25.912145614624023, 28.048208236694336, 30.184268951416016, 32.32033157348633, 34.45639419555664, 36.59245681762695, 38.728515625, 40.86457824707031, 43.000640869140625, 45.13670349121094, 47.27276611328125, 49.40882873535156, 51.544891357421875, 53.68095397949219, 55.8170166015625, 57.95307540893555, 60.08913803100586, 62.22520065307617, 64.36125946044922, 66.49732208251953]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 8.0, 5.0, 3.0, 5.0, 6.0, 5.0, 6.0, 14.0, 6.0, 14.0, 17.0, 19.0, 25.0, 20.0, 27.0, 24.0, 30.0, 23.0, 32.0, 36.0, 32.0, 42.0, 41.0, 48.0, 37.0, 35.0, 42.0, 37.0, 30.0, 37.0, 38.0, 41.0, 31.0, 28.0, 25.0, 18.0, 16.0, 13.0, 9.0, 21.0, 12.0, 6.0, 13.0, 9.0, 7.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-10.234375, -9.9442138671875, -9.654052734375, -9.3638916015625, -9.07373046875, -8.7835693359375, -8.493408203125, -8.2032470703125, -7.9130859375, -7.6229248046875, -7.332763671875, -7.0426025390625, -6.75244140625, -6.4622802734375, -6.172119140625, -5.8819580078125, -5.591796875, -5.3016357421875, -5.011474609375, -4.7213134765625, -4.43115234375, -4.1409912109375, -3.850830078125, -3.5606689453125, -3.2705078125, -2.9803466796875, -2.690185546875, -2.4000244140625, -2.10986328125, -1.8197021484375, -1.529541015625, -1.2393798828125, -0.94921875, -0.6590576171875, -0.368896484375, -0.0787353515625, 0.21142578125, 0.5015869140625, 0.791748046875, 1.0819091796875, 1.3720703125, 1.6622314453125, 1.952392578125, 2.2425537109375, 2.53271484375, 2.8228759765625, 3.113037109375, 3.4031982421875, 3.693359375, 3.9835205078125, 4.273681640625, 4.5638427734375, 4.85400390625, 5.1441650390625, 5.434326171875, 5.7244873046875, 6.0146484375, 6.3048095703125, 6.594970703125, 6.8851318359375, 7.17529296875, 7.4654541015625, 7.755615234375, 8.0457763671875, 8.3359375]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 8.0, 15.0, 18.0, 30.0, 42.0, 77.0, 97.0, 165.0, 222.0, 309.0, 433.0, 668.0, 907.0, 1284.0, 1815.0, 2550.0, 3673.0, 5007.0, 7467.0, 10665.0, 15277.0, 22079.0, 32237.0, 48584.0, 73283.0, 114971.0, 178679.0, 180405.0, 116513.0, 74597.0, 49311.0, 33248.0, 22388.0, 15369.0, 10885.0, 7527.0, 5285.0, 3703.0, 2666.0, 1840.0, 1258.0, 956.0, 685.0, 436.0, 307.0, 197.0, 125.0, 120.0, 76.0, 39.0, 14.0, 14.0, 19.0, 9.0, 6.0, 2.0, 3.0], "bins": [-0.211669921875, -0.20544815063476562, -0.19922637939453125, -0.19300460815429688, -0.1867828369140625, -0.18056106567382812, -0.17433929443359375, -0.16811752319335938, -0.161895751953125, -0.15567398071289062, -0.14945220947265625, -0.14323043823242188, -0.1370086669921875, -0.13078689575195312, -0.12456512451171875, -0.11834335327148438, -0.11212158203125, -0.10589981079101562, -0.09967803955078125, -0.09345626831054688, -0.0872344970703125, -0.08101272583007812, -0.07479095458984375, -0.06856918334960938, -0.062347412109375, -0.056125640869140625, -0.04990386962890625, -0.043682098388671875, -0.0374603271484375, -0.031238555908203125, -0.02501678466796875, -0.018795013427734375, -0.0125732421875, -0.006351470947265625, -0.00012969970703125, 0.006092071533203125, 0.0123138427734375, 0.018535614013671875, 0.02475738525390625, 0.030979156494140625, 0.037200927734375, 0.043422698974609375, 0.04964447021484375, 0.055866241455078125, 0.0620880126953125, 0.06830978393554688, 0.07453155517578125, 0.08075332641601562, 0.08697509765625, 0.09319686889648438, 0.09941864013671875, 0.10564041137695312, 0.1118621826171875, 0.11808395385742188, 0.12430572509765625, 0.13052749633789062, 0.136749267578125, 0.14297103881835938, 0.14919281005859375, 0.15541458129882812, 0.1616363525390625, 0.16785812377929688, 0.17407989501953125, 0.18030166625976562, 0.1865234375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 6.0, 5.0, 6.0, 8.0, 8.0, 13.0, 14.0, 15.0, 19.0, 25.0, 28.0, 28.0, 31.0, 42.0, 29.0, 34.0, 38.0, 44.0, 39.0, 39.0, 1077.0, 47.0, 45.0, 42.0, 42.0, 43.0, 28.0, 33.0, 30.0, 21.0, 28.0, 18.0, 13.0, 11.0, 15.0, 14.0, 7.0, 13.0, 6.0, 5.0, 4.0, 6.0, 2.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.234375, -6.9774169921875, -6.720458984375, -6.4635009765625, -6.20654296875, -5.9495849609375, -5.692626953125, -5.4356689453125, -5.1787109375, -4.9217529296875, -4.664794921875, -4.4078369140625, -4.15087890625, -3.8939208984375, -3.636962890625, -3.3800048828125, -3.123046875, -2.8660888671875, -2.609130859375, -2.3521728515625, -2.09521484375, -1.8382568359375, -1.581298828125, -1.3243408203125, -1.0673828125, -0.8104248046875, -0.553466796875, -0.2965087890625, -0.03955078125, 0.2174072265625, 0.474365234375, 0.7313232421875, 0.98828125, 1.2452392578125, 1.502197265625, 1.7591552734375, 2.01611328125, 2.2730712890625, 2.530029296875, 2.7869873046875, 3.0439453125, 3.3009033203125, 3.557861328125, 3.8148193359375, 4.07177734375, 4.3287353515625, 4.585693359375, 4.8426513671875, 5.099609375, 5.3565673828125, 5.613525390625, 5.8704833984375, 6.12744140625, 6.3843994140625, 6.641357421875, 6.8983154296875, 7.1552734375, 7.4122314453125, 7.669189453125, 7.9261474609375, 8.18310546875, 8.4400634765625, 8.697021484375, 8.9539794921875, 9.2109375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 4.0, 5.0, 7.0, 14.0, 21.0, 25.0, 42.0, 67.0, 91.0, 125.0, 213.0, 281.0, 399.0, 617.0, 870.0, 1297.0, 1905.0, 2792.0, 4256.0, 6508.0, 9810.0, 14706.0, 22952.0, 35822.0, 55471.0, 91191.0, 152594.0, 1269645.0, 161718.0, 96723.0, 59217.0, 37749.0, 24023.0, 15623.0, 10245.0, 6714.0, 4399.0, 2856.0, 1891.0, 1326.0, 871.0, 654.0, 427.0, 301.0, 211.0, 150.0, 111.0, 64.0, 43.0, 40.0, 15.0, 16.0, 7.0, 5.0, 4.0, 1.0, 5.0, 1.0, 0.0, 3.0, 4.0], "bins": [-0.110107421875, -0.10650444030761719, -0.10290145874023438, -0.09929847717285156, -0.09569549560546875, -0.09209251403808594, -0.08848953247070312, -0.08488655090332031, -0.0812835693359375, -0.07768058776855469, -0.07407760620117188, -0.07047462463378906, -0.06687164306640625, -0.06326866149902344, -0.059665679931640625, -0.05606269836425781, -0.052459716796875, -0.04885673522949219, -0.045253753662109375, -0.04165077209472656, -0.03804779052734375, -0.03444480895996094, -0.030841827392578125, -0.027238845825195312, -0.0236358642578125, -0.020032882690429688, -0.016429901123046875, -0.012826919555664062, -0.00922393798828125, -0.0056209564208984375, -0.002017974853515625, 0.0015850067138671875, 0.00518798828125, 0.008790969848632812, 0.012393951416015625, 0.015996932983398438, 0.01959991455078125, 0.023202896118164062, 0.026805877685546875, 0.030408859252929688, 0.0340118408203125, 0.03761482238769531, 0.041217803955078125, 0.04482078552246094, 0.04842376708984375, 0.05202674865722656, 0.055629730224609375, 0.05923271179199219, 0.062835693359375, 0.06643867492675781, 0.07004165649414062, 0.07364463806152344, 0.07724761962890625, 0.08085060119628906, 0.08445358276367188, 0.08805656433105469, 0.0916595458984375, 0.09526252746582031, 0.09886550903320312, 0.10246849060058594, 0.10607147216796875, 0.10967445373535156, 0.11327743530273438, 0.11688041687011719, 0.1204833984375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 13.0, 10.0, 9.0, 14.0, 15.0, 16.0, 15.0, 35.0, 36.0, 50.0, 39.0, 72.0, 73.0, 74.0, 76.0, 68.0, 68.0, 55.0, 54.0, 45.0, 27.0, 28.0, 20.0, 17.0, 18.0, 11.0, 9.0, 3.0, 7.0, 2.0, 3.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0013179779052734375, -0.0012768656015396118, -0.0012357532978057861, -0.0011946409940719604, -0.0011535286903381348, -0.001112416386604309, -0.0010713040828704834, -0.0010301917791366577, -0.000989079475402832, -0.0009479671716690063, -0.0009068548679351807, -0.000865742564201355, -0.0008246302604675293, -0.0007835179567337036, -0.0007424056529998779, -0.0007012933492660522, -0.0006601810455322266, -0.0006190687417984009, -0.0005779564380645752, -0.0005368441343307495, -0.0004957318305969238, -0.00045461952686309814, -0.00041350722312927246, -0.0003723949193954468, -0.0003312826156616211, -0.0002901703119277954, -0.0002490580081939697, -0.00020794570446014404, -0.00016683340072631836, -0.00012572109699249268, -8.460879325866699e-05, -4.349648952484131e-05, -2.384185791015625e-06, 3.872811794281006e-05, 7.984042167663574e-05, 0.00012095272541046143, 0.0001620650291442871, 0.0002031773328781128, 0.0002442896366119385, 0.00028540194034576416, 0.00032651424407958984, 0.00036762654781341553, 0.0004087388515472412, 0.0004498511552810669, 0.0004909634590148926, 0.0005320757627487183, 0.0005731880664825439, 0.0006143003702163696, 0.0006554126739501953, 0.000696524977684021, 0.0007376372814178467, 0.0007787495851516724, 0.000819861888885498, 0.0008609741926193237, 0.0009020864963531494, 0.0009431988000869751, 0.0009843111038208008, 0.0010254234075546265, 0.0010665357112884521, 0.0011076480150222778, 0.0011487603187561035, 0.0011898726224899292, 0.0012309849262237549, 0.0012720972299575806, 0.0013132095336914062]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 2.0, 6.0, 3.0, 10.0, 10.0, 14.0, 21.0, 23.0, 34.0, 35.0, 66.0, 116.0, 206.0, 445.0, 1739.0, 931753.0, 112000.0, 1200.0, 391.0, 164.0, 77.0, 75.0, 40.0, 18.0, 23.0, 15.0, 15.0, 9.0, 10.0, 11.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.027862548828125, -0.026988983154296875, -0.02611541748046875, -0.025241851806640625, -0.0243682861328125, -0.023494720458984375, -0.02262115478515625, -0.021747589111328125, -0.0208740234375, -0.020000457763671875, -0.01912689208984375, -0.018253326416015625, -0.0173797607421875, -0.016506195068359375, -0.01563262939453125, -0.014759063720703125, -0.013885498046875, -0.013011932373046875, -0.01213836669921875, -0.011264801025390625, -0.0103912353515625, -0.009517669677734375, -0.00864410400390625, -0.007770538330078125, -0.00689697265625, -0.006023406982421875, -0.00514984130859375, -0.004276275634765625, -0.0034027099609375, -0.002529144287109375, -0.00165557861328125, -0.000782012939453125, 9.1552734375e-05, 0.000965118408203125, 0.00183868408203125, 0.002712249755859375, 0.0035858154296875, 0.004459381103515625, 0.00533294677734375, 0.006206512451171875, 0.007080078125, 0.007953643798828125, 0.00882720947265625, 0.009700775146484375, 0.0105743408203125, 0.011447906494140625, 0.01232147216796875, 0.013195037841796875, 0.014068603515625, 0.014942169189453125, 0.01581573486328125, 0.016689300537109375, 0.0175628662109375, 0.018436431884765625, 0.01930999755859375, 0.020183563232421875, 0.02105712890625, 0.021930694580078125, 0.02280426025390625, 0.023677825927734375, 0.0245513916015625, 0.025424957275390625, 0.02629852294921875, 0.027172088623046875, 0.028045654296875]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 28.0, 967.0, 18.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03016747534275055, -0.02961399033665657, -0.029060503467917442, -0.028507018461823463, -0.027953531593084335, -0.027400046586990356, -0.02684655971825123, -0.02629307471215725, -0.02573958784341812, -0.025186102837324142, -0.024632615968585014, -0.024079130962491035, -0.023525644093751907, -0.02297215908765793, -0.0224186722189188, -0.02186518721282482, -0.021311702206730843, -0.020758217200636864, -0.020204730331897736, -0.019651245325803757, -0.01909775845706463, -0.01854427345097065, -0.01799078658223152, -0.017437301576137543, -0.016883816570043564, -0.016330331563949585, -0.015776844695210457, -0.015223358757793903, -0.01466987282037735, -0.014116387814283371, -0.013562901876866817, -0.013009415939450264, -0.012455929070711136, -0.011902443133294582, -0.011348957195878029, -0.010795471258461475, -0.010241985321044922, -0.009688500314950943, -0.00913501437753439, -0.008581528440117836, -0.008028042502701283, -0.007474556565284729, -0.0069210706278681755, -0.006367585156112909, -0.005814099218696356, -0.005260613281279802, -0.004707127809524536, -0.004153641872107983, -0.003600155934691429, -0.0030466699972748756, -0.002493184292688966, -0.0019396984716877341, -0.0013862126506865025, -0.000832726713269949, -0.0002792410086840391, 0.00027424469590187073, 0.0008277306333184242, 0.001381216454319656, 0.0019347022753208876, 0.0024881879799067974, 0.003041673917323351, 0.0035951598547399044, 0.004148645326495171, 0.004702131263911724, 0.005255617201328278]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 5.0, 2.0, 0.0, 5.0, 1.0, 3.0, 2.0, 6.0, 9.0, 6.0, 8.0, 8.0, 17.0, 21.0, 17.0, 25.0, 25.0, 28.0, 37.0, 47.0, 36.0, 37.0, 41.0, 44.0, 36.0, 47.0, 44.0, 53.0, 50.0, 39.0, 50.0, 28.0, 41.0, 26.0, 26.0, 27.0, 25.0, 15.0, 18.0, 10.0, 15.0, 14.0, 5.0, 5.0, 2.0, 2.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0010303258895874023, -0.0009916974231600761, -0.0009530689567327499, -0.0009144404903054237, -0.0008758120238780975, -0.0008371835574507713, -0.0007985550910234451, -0.0007599266245961189, -0.0007212981581687927, -0.0006826696917414665, -0.0006440412253141403, -0.0006054127588868141, -0.0005667842924594879, -0.0005281558260321617, -0.0004895273596048355, -0.0004508988931775093, -0.0004122704267501831, -0.0003736419603228569, -0.0003350134938955307, -0.0002963850274682045, -0.0002577565610408783, -0.0002191280946135521, -0.0001804996281862259, -0.0001418711617588997, -0.00010324269533157349, -6.461422890424728e-05, -2.598576247692108e-05, 1.2642703950405121e-05, 5.127117037773132e-05, 8.989963680505753e-05, 0.00012852810323238373, 0.00016715656965970993, 0.00020578503608703613, 0.00024441350251436234, 0.00028304196894168854, 0.00032167043536901474, 0.00036029890179634094, 0.00039892736822366714, 0.00043755583465099335, 0.00047618430107831955, 0.0005148127675056458, 0.000553441233932972, 0.0005920697003602982, 0.0006306981667876244, 0.0006693266332149506, 0.0007079550996422768, 0.000746583566069603, 0.0007852120324969292, 0.0008238404989242554, 0.0008624689653515816, 0.0009010974317789078, 0.000939725898206234, 0.0009783543646335602, 0.0010169828310608864, 0.0010556112974882126, 0.0010942397639155388, 0.001132868230342865, 0.0011714966967701912, 0.0012101251631975174, 0.0012487536296248436, 0.0012873820960521698, 0.001326010562479496, 0.0013646390289068222, 0.0014032674953341484, 0.0014418959617614746]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 8.0, 5.0, 3.0, 5.0, 6.0, 5.0, 6.0, 14.0, 6.0, 14.0, 17.0, 19.0, 25.0, 20.0, 27.0, 24.0, 30.0, 23.0, 32.0, 36.0, 32.0, 42.0, 41.0, 48.0, 37.0, 35.0, 42.0, 37.0, 30.0, 37.0, 38.0, 41.0, 31.0, 28.0, 25.0, 18.0, 16.0, 13.0, 9.0, 21.0, 12.0, 6.0, 13.0, 9.0, 7.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-10.234375, -9.9442138671875, -9.654052734375, -9.3638916015625, -9.07373046875, -8.7835693359375, -8.493408203125, -8.2032470703125, -7.9130859375, -7.6229248046875, -7.332763671875, -7.0426025390625, -6.75244140625, -6.4622802734375, -6.172119140625, -5.8819580078125, -5.591796875, -5.3016357421875, -5.011474609375, -4.7213134765625, -4.43115234375, -4.1409912109375, -3.850830078125, -3.5606689453125, -3.2705078125, -2.9803466796875, -2.690185546875, -2.4000244140625, -2.10986328125, -1.8197021484375, -1.529541015625, -1.2393798828125, -0.94921875, -0.6590576171875, -0.368896484375, -0.0787353515625, 0.21142578125, 0.5015869140625, 0.791748046875, 1.0819091796875, 1.3720703125, 1.6622314453125, 1.952392578125, 2.2425537109375, 2.53271484375, 2.8228759765625, 3.113037109375, 3.4031982421875, 3.693359375, 3.9835205078125, 4.273681640625, 4.5638427734375, 4.85400390625, 5.1441650390625, 5.434326171875, 5.7244873046875, 6.0146484375, 6.3048095703125, 6.594970703125, 6.8851318359375, 7.17529296875, 7.4654541015625, 7.755615234375, 8.0457763671875, 8.3359375]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 10.0, 18.0, 20.0, 27.0, 33.0, 52.0, 66.0, 106.0, 152.0, 215.0, 267.0, 434.0, 598.0, 917.0, 1269.0, 2167.0, 3378.0, 5230.0, 8896.0, 16607.0, 39525.0, 225401.0, 622552.0, 68457.0, 22757.0, 11284.0, 6499.0, 3900.0, 2588.0, 1620.0, 1113.0, 718.0, 507.0, 368.0, 247.0, 182.0, 103.0, 96.0, 48.0, 37.0, 29.0, 21.0, 12.0, 9.0, 6.0, 5.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.453125, -18.787109375, -18.12109375, -17.455078125, -16.7890625, -16.123046875, -15.45703125, -14.791015625, -14.125, -13.458984375, -12.79296875, -12.126953125, -11.4609375, -10.794921875, -10.12890625, -9.462890625, -8.796875, -8.130859375, -7.46484375, -6.798828125, -6.1328125, -5.466796875, -4.80078125, -4.134765625, -3.46875, -2.802734375, -2.13671875, -1.470703125, -0.8046875, -0.138671875, 0.52734375, 1.193359375, 1.859375, 2.525390625, 3.19140625, 3.857421875, 4.5234375, 5.189453125, 5.85546875, 6.521484375, 7.1875, 7.853515625, 8.51953125, 9.185546875, 9.8515625, 10.517578125, 11.18359375, 11.849609375, 12.515625, 13.181640625, 13.84765625, 14.513671875, 15.1796875, 15.845703125, 16.51171875, 17.177734375, 17.84375, 18.509765625, 19.17578125, 19.841796875, 20.5078125, 21.173828125, 21.83984375, 22.505859375, 23.171875]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 6.0, 5.0, 8.0, 4.0, 6.0, 8.0, 6.0, 11.0, 16.0, 17.0, 13.0, 22.0, 21.0, 29.0, 32.0, 37.0, 34.0, 39.0, 39.0, 54.0, 58.0, 104.0, 287.0, 1579.0, 138.0, 70.0, 43.0, 34.0, 42.0, 32.0, 29.0, 33.0, 25.0, 23.0, 17.0, 19.0, 23.0, 10.0, 17.0, 9.0, 5.0, 6.0, 7.0, 6.0, 3.0, 5.0, 8.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0], "bins": [-30.859375, -29.956298828125, -29.05322265625, -28.150146484375, -27.2470703125, -26.343994140625, -25.44091796875, -24.537841796875, -23.634765625, -22.731689453125, -21.82861328125, -20.925537109375, -20.0224609375, -19.119384765625, -18.21630859375, -17.313232421875, -16.41015625, -15.507080078125, -14.60400390625, -13.700927734375, -12.7978515625, -11.894775390625, -10.99169921875, -10.088623046875, -9.185546875, -8.282470703125, -7.37939453125, -6.476318359375, -5.5732421875, -4.670166015625, -3.76708984375, -2.864013671875, -1.9609375, -1.057861328125, -0.15478515625, 0.748291015625, 1.6513671875, 2.554443359375, 3.45751953125, 4.360595703125, 5.263671875, 6.166748046875, 7.06982421875, 7.972900390625, 8.8759765625, 9.779052734375, 10.68212890625, 11.585205078125, 12.48828125, 13.391357421875, 14.29443359375, 15.197509765625, 16.1005859375, 17.003662109375, 17.90673828125, 18.809814453125, 19.712890625, 20.615966796875, 21.51904296875, 22.422119140625, 23.3251953125, 24.228271484375, 25.13134765625, 26.034423828125, 26.9375]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [6.0, 1.0, 3.0, 6.0, 5.0, 4.0, 2.0, 10.0, 8.0, 9.0, 2.0, 17.0, 13.0, 18.0, 30.0, 24.0, 27.0, 37.0, 45.0, 54.0, 91.0, 123.0, 243.0, 454.0, 1152.0, 3349.0, 12321.0, 88925.0, 2947977.0, 73954.0, 11136.0, 3324.0, 1153.0, 433.0, 201.0, 134.0, 92.0, 68.0, 50.0, 38.0, 26.0, 30.0, 18.0, 16.0, 22.0, 15.0, 9.0, 6.0, 6.0, 8.0, 5.0, 6.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-49.90625, -48.1533203125, -46.400390625, -44.6474609375, -42.89453125, -41.1416015625, -39.388671875, -37.6357421875, -35.8828125, -34.1298828125, -32.376953125, -30.6240234375, -28.87109375, -27.1181640625, -25.365234375, -23.6123046875, -21.859375, -20.1064453125, -18.353515625, -16.6005859375, -14.84765625, -13.0947265625, -11.341796875, -9.5888671875, -7.8359375, -6.0830078125, -4.330078125, -2.5771484375, -0.82421875, 0.9287109375, 2.681640625, 4.4345703125, 6.1875, 7.9404296875, 9.693359375, 11.4462890625, 13.19921875, 14.9521484375, 16.705078125, 18.4580078125, 20.2109375, 21.9638671875, 23.716796875, 25.4697265625, 27.22265625, 28.9755859375, 30.728515625, 32.4814453125, 34.234375, 35.9873046875, 37.740234375, 39.4931640625, 41.24609375, 42.9990234375, 44.751953125, 46.5048828125, 48.2578125, 50.0107421875, 51.763671875, 53.5166015625, 55.26953125, 57.0224609375, 58.775390625, 60.5283203125, 62.28125]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 6.0, 33.0, 162.0, 486.0, 261.0, 59.0, 11.0], "bins": [-482.2396240234375, -474.2826232910156, -466.32562255859375, -458.36865234375, -450.4116516113281, -442.45465087890625, -434.4976501464844, -426.5406799316406, -418.58367919921875, -410.6266784667969, -402.669677734375, -394.71270751953125, -386.7557067871094, -378.7987060546875, -370.8417053222656, -362.8847351074219, -354.927734375, -346.9707336425781, -339.01373291015625, -331.0567626953125, -323.0997619628906, -315.14276123046875, -307.1857604980469, -299.2287902832031, -291.27178955078125, -283.3147888183594, -275.3577880859375, -267.40081787109375, -259.4438171386719, -251.48681640625, -243.5298309326172, -235.5728302001953, -227.61582946777344, -219.65882873535156, -211.70184326171875, -203.74484252929688, -195.78785705566406, -187.8308563232422, -179.87387084960938, -171.9168701171875, -163.9598846435547, -156.0028839111328, -148.0458984375, -140.08889770507812, -132.1319122314453, -124.17491149902344, -116.21792602539062, -108.26092529296875, -100.3039321899414, -92.34693908691406, -84.38994598388672, -76.43295288085938, -68.47595977783203, -60.51896286010742, -52.56196975708008, -44.604976654052734, -36.64798355102539, -28.690990447998047, -20.733997344970703, -12.777002334594727, -4.820009231567383, 3.1369857788085938, 11.093978881835938, 19.05097198486328, 27.007965087890625]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 1.0, 3.0, 1.0, 4.0, 2.0, 4.0, 5.0, 9.0, 9.0, 8.0, 11.0, 18.0, 27.0, 24.0, 14.0, 31.0, 37.0, 30.0, 35.0, 38.0, 43.0, 55.0, 46.0, 44.0, 46.0, 44.0, 45.0, 41.0, 37.0, 29.0, 28.0, 33.0, 43.0, 29.0, 21.0, 19.0, 17.0, 22.0, 4.0, 14.0, 7.0, 10.0, 6.0, 7.0, 6.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.95658111572266, -89.61892700195312, -86.28126525878906, -82.94361114501953, -79.60595703125, -76.26829528808594, -72.9306411743164, -69.59298706054688, -66.25532531738281, -62.917667388916016, -59.58000946044922, -56.24235534667969, -52.90469741821289, -49.567039489746094, -46.22938537597656, -42.891727447509766, -39.55406951904297, -36.21641159057617, -32.878753662109375, -29.541099548339844, -26.203441619873047, -22.86578369140625, -19.528127670288086, -16.190471649169922, -12.852813720703125, -9.515156745910645, -6.177499771118164, -2.8398427963256836, 0.4978141784667969, 3.8354721069335938, 7.173128128051758, 10.510784149169922, 13.84844970703125, 17.186107635498047, 20.52376365661621, 23.861419677734375, 27.199077606201172, 30.53673553466797, 33.8743896484375, 37.2120475769043, 40.549705505371094, 43.88736343383789, 47.22502136230469, 50.56267547607422, 53.900333404541016, 57.23799133300781, 60.575645446777344, 63.91330337524414, 67.25096130371094, 70.58861541748047, 73.92627716064453, 77.26393127441406, 80.60159301757812, 83.93924713134766, 87.27690124511719, 90.61456298828125, 93.95221710205078, 97.28987121582031, 100.62753295898438, 103.9651870727539, 107.30284118652344, 110.6405029296875, 113.97815704345703, 117.31581115722656, 120.65347290039062]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 5.0, 4.0, 5.0, 4.0, 4.0, 3.0, 7.0, 8.0, 12.0, 10.0, 14.0, 12.0, 15.0, 18.0, 25.0, 20.0, 28.0, 33.0, 38.0, 24.0, 34.0, 37.0, 41.0, 47.0, 37.0, 46.0, 31.0, 38.0, 32.0, 29.0, 40.0, 55.0, 26.0, 35.0, 34.0, 18.0, 20.0, 15.0, 13.0, 14.0, 17.0, 19.0, 9.0, 6.0, 6.0, 5.0, 3.0, 9.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-11.03125, -10.7103271484375, -10.389404296875, -10.0684814453125, -9.74755859375, -9.4266357421875, -9.105712890625, -8.7847900390625, -8.4638671875, -8.1429443359375, -7.822021484375, -7.5010986328125, -7.18017578125, -6.8592529296875, -6.538330078125, -6.2174072265625, -5.896484375, -5.5755615234375, -5.254638671875, -4.9337158203125, -4.61279296875, -4.2918701171875, -3.970947265625, -3.6500244140625, -3.3291015625, -3.0081787109375, -2.687255859375, -2.3663330078125, -2.04541015625, -1.7244873046875, -1.403564453125, -1.0826416015625, -0.76171875, -0.4407958984375, -0.119873046875, 0.2010498046875, 0.52197265625, 0.8428955078125, 1.163818359375, 1.4847412109375, 1.8056640625, 2.1265869140625, 2.447509765625, 2.7684326171875, 3.08935546875, 3.4102783203125, 3.731201171875, 4.0521240234375, 4.373046875, 4.6939697265625, 5.014892578125, 5.3358154296875, 5.65673828125, 5.9776611328125, 6.298583984375, 6.6195068359375, 6.9404296875, 7.2613525390625, 7.582275390625, 7.9031982421875, 8.22412109375, 8.5450439453125, 8.865966796875, 9.1868896484375, 9.5078125]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 4.0, 4.0, 4.0, 10.0, 15.0, 13.0, 9.0, 17.0, 19.0, 20.0, 34.0, 55.0, 82.0, 154.0, 246.0, 432.0, 856.0, 1734.0, 3905.0, 9767.0, 33470.0, 564452.0, 3260179.0, 280625.0, 24716.0, 7663.0, 3050.0, 1313.0, 612.0, 321.0, 161.0, 92.0, 56.0, 40.0, 34.0, 21.0, 13.0, 21.0, 12.0, 11.0, 9.0, 4.0, 6.0, 5.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-35.25, -34.22509765625, -33.2001953125, -32.17529296875, -31.150390625, -30.12548828125, -29.1005859375, -28.07568359375, -27.05078125, -26.02587890625, -25.0009765625, -23.97607421875, -22.951171875, -21.92626953125, -20.9013671875, -19.87646484375, -18.8515625, -17.82666015625, -16.8017578125, -15.77685546875, -14.751953125, -13.72705078125, -12.7021484375, -11.67724609375, -10.65234375, -9.62744140625, -8.6025390625, -7.57763671875, -6.552734375, -5.52783203125, -4.5029296875, -3.47802734375, -2.453125, -1.42822265625, -0.4033203125, 0.62158203125, 1.646484375, 2.67138671875, 3.6962890625, 4.72119140625, 5.74609375, 6.77099609375, 7.7958984375, 8.82080078125, 9.845703125, 10.87060546875, 11.8955078125, 12.92041015625, 13.9453125, 14.97021484375, 15.9951171875, 17.02001953125, 18.044921875, 19.06982421875, 20.0947265625, 21.11962890625, 22.14453125, 23.16943359375, 24.1943359375, 25.21923828125, 26.244140625, 27.26904296875, 28.2939453125, 29.31884765625, 30.34375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 2.0, 3.0, 1.0, 4.0, 4.0, 6.0, 3.0, 7.0, 6.0, 18.0, 8.0, 19.0, 24.0, 26.0, 37.0, 44.0, 69.0, 123.0, 141.0, 255.0, 444.0, 656.0, 797.0, 564.0, 310.0, 168.0, 106.0, 61.0, 36.0, 32.0, 25.0, 15.0, 18.0, 9.0, 11.0, 7.0, 6.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.296875, -23.5146484375, -22.732421875, -21.9501953125, -21.16796875, -20.3857421875, -19.603515625, -18.8212890625, -18.0390625, -17.2568359375, -16.474609375, -15.6923828125, -14.91015625, -14.1279296875, -13.345703125, -12.5634765625, -11.78125, -10.9990234375, -10.216796875, -9.4345703125, -8.65234375, -7.8701171875, -7.087890625, -6.3056640625, -5.5234375, -4.7412109375, -3.958984375, -3.1767578125, -2.39453125, -1.6123046875, -0.830078125, -0.0478515625, 0.734375, 1.5166015625, 2.298828125, 3.0810546875, 3.86328125, 4.6455078125, 5.427734375, 6.2099609375, 6.9921875, 7.7744140625, 8.556640625, 9.3388671875, 10.12109375, 10.9033203125, 11.685546875, 12.4677734375, 13.25, 14.0322265625, 14.814453125, 15.5966796875, 16.37890625, 17.1611328125, 17.943359375, 18.7255859375, 19.5078125, 20.2900390625, 21.072265625, 21.8544921875, 22.63671875, 23.4189453125, 24.201171875, 24.9833984375, 25.765625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 8.0, 13.0, 10.0, 16.0, 17.0, 28.0, 35.0, 70.0, 118.0, 289.0, 926.0, 3886.0, 34057.0, 3632592.0, 504462.0, 14393.0, 2196.0, 577.0, 221.0, 128.0, 54.0, 36.0, 34.0, 22.0, 16.0, 13.0, 16.0, 4.0, 8.0, 4.0, 7.0, 4.0, 2.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-92.5625, -89.7431640625, -86.923828125, -84.1044921875, -81.28515625, -78.4658203125, -75.646484375, -72.8271484375, -70.0078125, -67.1884765625, -64.369140625, -61.5498046875, -58.73046875, -55.9111328125, -53.091796875, -50.2724609375, -47.453125, -44.6337890625, -41.814453125, -38.9951171875, -36.17578125, -33.3564453125, -30.537109375, -27.7177734375, -24.8984375, -22.0791015625, -19.259765625, -16.4404296875, -13.62109375, -10.8017578125, -7.982421875, -5.1630859375, -2.34375, 0.4755859375, 3.294921875, 6.1142578125, 8.93359375, 11.7529296875, 14.572265625, 17.3916015625, 20.2109375, 23.0302734375, 25.849609375, 28.6689453125, 31.48828125, 34.3076171875, 37.126953125, 39.9462890625, 42.765625, 45.5849609375, 48.404296875, 51.2236328125, 54.04296875, 56.8623046875, 59.681640625, 62.5009765625, 65.3203125, 68.1396484375, 70.958984375, 73.7783203125, 76.59765625, 79.4169921875, 82.236328125, 85.0556640625, 87.875]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 7.0, 22.0, 62.0, 279.0, 402.0, 168.0, 58.0, 16.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-568.2228393554688, -556.716796875, -545.2108154296875, -533.7047729492188, -522.19873046875, -510.6927490234375, -499.18670654296875, -487.6806945800781, -476.1746826171875, -464.6686706542969, -453.1626281738281, -441.6566162109375, -430.1506042480469, -418.64459228515625, -407.1385498046875, -395.6325378417969, -384.1264953613281, -372.6204833984375, -361.11444091796875, -349.6084289550781, -338.1024169921875, -326.59637451171875, -315.0903625488281, -303.5843505859375, -292.07830810546875, -280.5722961425781, -269.0662536621094, -257.56024169921875, -246.05422973632812, -234.54820251464844, -223.04217529296875, -211.53616333007812, -200.03016662597656, -188.52413940429688, -177.01812744140625, -165.51210021972656, -154.00607299804688, -142.50006103515625, -130.99403381347656, -119.4880142211914, -107.98199462890625, -96.4759750366211, -84.96995544433594, -73.46392822265625, -61.957908630371094, -50.45188903808594, -38.94586181640625, -27.439842224121094, -15.933822631835938, -4.427801132202148, 7.078220367431641, 18.584243774414062, 30.09026336669922, 41.596282958984375, 53.10231018066406, 64.60832977294922, 76.11434936523438, 87.62036895751953, 99.12638854980469, 110.63241577148438, 122.13843536376953, 133.6444549560547, 145.15048217773438, 156.656494140625, 168.1625213623047]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 12.0, 9.0, 10.0, 8.0, 15.0, 13.0, 10.0, 24.0, 21.0, 13.0, 30.0, 16.0, 20.0, 28.0, 26.0, 29.0, 44.0, 39.0, 36.0, 46.0, 24.0, 37.0, 31.0, 33.0, 41.0, 29.0, 48.0, 37.0, 35.0, 31.0, 28.0, 22.0, 25.0, 18.0, 21.0, 16.0, 16.0, 6.0, 15.0, 3.0, 13.0, 6.0, 2.0, 6.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-74.22453308105469, -72.0906982421875, -69.95685577392578, -67.8230209350586, -65.6891860961914, -63.55534744262695, -61.4215087890625, -59.28767395019531, -57.15383529663086, -55.019996643066406, -52.88616180419922, -50.752323150634766, -48.61848449707031, -46.484649658203125, -44.35081100463867, -42.21697235107422, -40.08313751220703, -37.94929885864258, -35.81546401977539, -33.68162536621094, -31.547788619995117, -29.413951873779297, -27.280113220214844, -25.146276473999023, -23.012439727783203, -20.878602981567383, -18.744766235351562, -16.61092758178711, -14.477090835571289, -12.343254089355469, -10.209416389465332, -8.075578689575195, -5.941741943359375, -3.8079047203063965, -1.674067497253418, 0.45976972579956055, 2.593606948852539, 4.727443695068359, 6.861281394958496, 8.995119094848633, 11.128955841064453, 13.262792587280273, 15.39663028717041, 17.530467987060547, 19.664304733276367, 21.798141479492188, 23.93198013305664, 26.06581687927246, 28.19965362548828, 30.3334903717041, 32.46732711791992, 34.601165771484375, 36.73500061035156, 38.868839263916016, 41.00267791748047, 43.136512756347656, 45.27035140991211, 47.40419006347656, 49.53802490234375, 51.6718635559082, 53.805702209472656, 55.939537048339844, 58.0733757019043, 60.20721435546875, 62.34104919433594]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 1.0, 1.0, 2.0, 4.0, 7.0, 6.0, 5.0, 8.0, 10.0, 6.0, 7.0, 21.0, 14.0, 19.0, 24.0, 29.0, 22.0, 31.0, 31.0, 40.0, 38.0, 21.0, 39.0, 33.0, 44.0, 36.0, 37.0, 33.0, 35.0, 36.0, 46.0, 25.0, 33.0, 30.0, 36.0, 32.0, 20.0, 17.0, 16.0, 13.0, 19.0, 13.0, 17.0, 11.0, 13.0, 3.0, 5.0, 4.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.375, -10.0693359375, -9.763671875, -9.4580078125, -9.15234375, -8.8466796875, -8.541015625, -8.2353515625, -7.9296875, -7.6240234375, -7.318359375, -7.0126953125, -6.70703125, -6.4013671875, -6.095703125, -5.7900390625, -5.484375, -5.1787109375, -4.873046875, -4.5673828125, -4.26171875, -3.9560546875, -3.650390625, -3.3447265625, -3.0390625, -2.7333984375, -2.427734375, -2.1220703125, -1.81640625, -1.5107421875, -1.205078125, -0.8994140625, -0.59375, -0.2880859375, 0.017578125, 0.3232421875, 0.62890625, 0.9345703125, 1.240234375, 1.5458984375, 1.8515625, 2.1572265625, 2.462890625, 2.7685546875, 3.07421875, 3.3798828125, 3.685546875, 3.9912109375, 4.296875, 4.6025390625, 4.908203125, 5.2138671875, 5.51953125, 5.8251953125, 6.130859375, 6.4365234375, 6.7421875, 7.0478515625, 7.353515625, 7.6591796875, 7.96484375, 8.2705078125, 8.576171875, 8.8818359375, 9.1875]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 5.0, 12.0, 8.0, 26.0, 27.0, 45.0, 75.0, 111.0, 137.0, 224.0, 311.0, 401.0, 711.0, 971.0, 1532.0, 2163.0, 3288.0, 4933.0, 7351.0, 11536.0, 18125.0, 27815.0, 43626.0, 69351.0, 113528.0, 181669.0, 204458.0, 132235.0, 81488.0, 50587.0, 32094.0, 20744.0, 13403.0, 8697.0, 5718.0, 3680.0, 2470.0, 1582.0, 1136.0, 773.0, 475.0, 324.0, 225.0, 163.0, 116.0, 74.0, 45.0, 30.0, 22.0, 17.0, 8.0, 10.0, 2.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.230224609375, -0.22259140014648438, -0.21495819091796875, -0.20732498168945312, -0.1996917724609375, -0.19205856323242188, -0.18442535400390625, -0.17679214477539062, -0.169158935546875, -0.16152572631835938, -0.15389251708984375, -0.14625930786132812, -0.1386260986328125, -0.13099288940429688, -0.12335968017578125, -0.11572647094726562, -0.10809326171875, -0.10046005249023438, -0.09282684326171875, -0.08519363403320312, -0.0775604248046875, -0.06992721557617188, -0.06229400634765625, -0.054660797119140625, -0.047027587890625, -0.039394378662109375, -0.03176116943359375, -0.024127960205078125, -0.0164947509765625, -0.008861541748046875, -0.00122833251953125, 0.006404876708984375, 0.0140380859375, 0.021671295166015625, 0.02930450439453125, 0.036937713623046875, 0.0445709228515625, 0.052204132080078125, 0.05983734130859375, 0.06747055053710938, 0.075103759765625, 0.08273696899414062, 0.09037017822265625, 0.09800338745117188, 0.1056365966796875, 0.11326980590820312, 0.12090301513671875, 0.12853622436523438, 0.13616943359375, 0.14380264282226562, 0.15143585205078125, 0.15906906127929688, 0.1667022705078125, 0.17433547973632812, 0.18196868896484375, 0.18960189819335938, 0.197235107421875, 0.20486831665039062, 0.21250152587890625, 0.22013473510742188, 0.2277679443359375, 0.23540115356445312, 0.24303436279296875, 0.2506675720214844, 0.25830078125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 4.0, 6.0, 11.0, 4.0, 10.0, 11.0, 15.0, 10.0, 23.0, 24.0, 27.0, 18.0, 28.0, 44.0, 31.0, 45.0, 41.0, 44.0, 37.0, 38.0, 38.0, 1063.0, 49.0, 43.0, 34.0, 39.0, 37.0, 39.0, 32.0, 24.0, 24.0, 18.0, 20.0, 15.0, 19.0, 10.0, 12.0, 12.0, 9.0, 8.0, 7.0, 2.0, 2.0, 4.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.9609375, -7.6976318359375, -7.434326171875, -7.1710205078125, -6.90771484375, -6.6444091796875, -6.381103515625, -6.1177978515625, -5.8544921875, -5.5911865234375, -5.327880859375, -5.0645751953125, -4.80126953125, -4.5379638671875, -4.274658203125, -4.0113525390625, -3.748046875, -3.4847412109375, -3.221435546875, -2.9581298828125, -2.69482421875, -2.4315185546875, -2.168212890625, -1.9049072265625, -1.6416015625, -1.3782958984375, -1.114990234375, -0.8516845703125, -0.58837890625, -0.3250732421875, -0.061767578125, 0.2015380859375, 0.46484375, 0.7281494140625, 0.991455078125, 1.2547607421875, 1.51806640625, 1.7813720703125, 2.044677734375, 2.3079833984375, 2.5712890625, 2.8345947265625, 3.097900390625, 3.3612060546875, 3.62451171875, 3.8878173828125, 4.151123046875, 4.4144287109375, 4.677734375, 4.9410400390625, 5.204345703125, 5.4676513671875, 5.73095703125, 5.9942626953125, 6.257568359375, 6.5208740234375, 6.7841796875, 7.0474853515625, 7.310791015625, 7.5740966796875, 7.83740234375, 8.1007080078125, 8.364013671875, 8.6273193359375, 8.890625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 11.0, 19.0, 17.0, 24.0, 41.0, 91.0, 97.0, 142.0, 200.0, 311.0, 472.0, 639.0, 1054.0, 1389.0, 2194.0, 3200.0, 4898.0, 7488.0, 11487.0, 17695.0, 27607.0, 43115.0, 68410.0, 111839.0, 190023.0, 1256078.0, 129643.0, 79537.0, 49504.0, 31792.0, 20409.0, 12986.0, 8249.0, 5482.0, 3626.0, 2380.0, 1547.0, 1063.0, 693.0, 556.0, 360.0, 237.0, 173.0, 117.0, 67.0, 53.0, 47.0, 25.0, 15.0, 11.0, 9.0, 5.0, 4.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.12237548828125, -0.11856842041015625, -0.1147613525390625, -0.11095428466796875, -0.107147216796875, -0.10334014892578125, -0.0995330810546875, -0.09572601318359375, -0.0919189453125, -0.08811187744140625, -0.0843048095703125, -0.08049774169921875, -0.076690673828125, -0.07288360595703125, -0.0690765380859375, -0.06526947021484375, -0.06146240234375, -0.05765533447265625, -0.0538482666015625, -0.05004119873046875, -0.046234130859375, -0.04242706298828125, -0.0386199951171875, -0.03481292724609375, -0.031005859375, -0.02719879150390625, -0.0233917236328125, -0.01958465576171875, -0.015777587890625, -0.01197052001953125, -0.0081634521484375, -0.00435638427734375, -0.00054931640625, 0.00325775146484375, 0.0070648193359375, 0.01087188720703125, 0.014678955078125, 0.01848602294921875, 0.0222930908203125, 0.02610015869140625, 0.0299072265625, 0.03371429443359375, 0.0375213623046875, 0.04132843017578125, 0.045135498046875, 0.04894256591796875, 0.0527496337890625, 0.05655670166015625, 0.06036376953125, 0.06417083740234375, 0.0679779052734375, 0.07178497314453125, 0.075592041015625, 0.07939910888671875, 0.0832061767578125, 0.08701324462890625, 0.0908203125, 0.09462738037109375, 0.0984344482421875, 0.10224151611328125, 0.106048583984375, 0.10985565185546875, 0.1136627197265625, 0.11746978759765625, 0.12127685546875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 4.0, 7.0, 4.0, 10.0, 12.0, 15.0, 17.0, 23.0, 18.0, 20.0, 22.0, 25.0, 37.0, 41.0, 44.0, 47.0, 54.0, 63.0, 55.0, 56.0, 57.0, 55.0, 44.0, 36.0, 40.0, 28.0, 35.0, 20.0, 18.0, 17.0, 20.0, 13.0, 6.0, 7.0, 9.0, 8.0, 4.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011873245239257812, -0.0011524409055709839, -0.0011175572872161865, -0.0010826736688613892, -0.0010477900505065918, -0.0010129064321517944, -0.000978022813796997, -0.0009431391954421997, -0.0009082555770874023, -0.000873371958732605, -0.0008384883403778076, -0.0008036047220230103, -0.0007687211036682129, -0.0007338374853134155, -0.0006989538669586182, -0.0006640702486038208, -0.0006291866302490234, -0.0005943030118942261, -0.0005594193935394287, -0.0005245357751846313, -0.000489652156829834, -0.0004547685384750366, -0.00041988492012023926, -0.0003850013017654419, -0.00035011768341064453, -0.00031523406505584717, -0.0002803504467010498, -0.00024546682834625244, -0.00021058320999145508, -0.00017569959163665771, -0.00014081597328186035, -0.00010593235492706299, -7.104873657226562e-05, -3.616511821746826e-05, -1.2814998626708984e-06, 3.3602118492126465e-05, 6.848573684692383e-05, 0.00010336935520172119, 0.00013825297355651855, 0.00017313659191131592, 0.00020802021026611328, 0.00024290382862091064, 0.000277787446975708, 0.00031267106533050537, 0.00034755468368530273, 0.0003824383020401001, 0.00041732192039489746, 0.0004522055387496948, 0.0004870891571044922, 0.0005219727754592896, 0.0005568563938140869, 0.0005917400121688843, 0.0006266236305236816, 0.000661507248878479, 0.0006963908672332764, 0.0007312744855880737, 0.0007661581039428711, 0.0008010417222976685, 0.0008359253406524658, 0.0008708089590072632, 0.0009056925773620605, 0.0009405761957168579, 0.0009754598140716553, 0.0010103434324264526, 0.00104522705078125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 4.0, 7.0, 9.0, 6.0, 8.0, 11.0, 19.0, 17.0, 18.0, 21.0, 35.0, 32.0, 55.0, 91.0, 186.0, 503.0, 1515.0, 636541.0, 407003.0, 1444.0, 458.0, 190.0, 98.0, 50.0, 40.0, 26.0, 25.0, 22.0, 17.0, 22.0, 15.0, 19.0, 11.0, 9.0, 4.0, 7.0, 4.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0230712890625, -0.022301912307739258, -0.021532535552978516, -0.020763158798217773, -0.01999378204345703, -0.01922440528869629, -0.018455028533935547, -0.017685651779174805, -0.016916275024414062, -0.01614689826965332, -0.015377521514892578, -0.014608144760131836, -0.013838768005371094, -0.013069391250610352, -0.01230001449584961, -0.011530637741088867, -0.010761260986328125, -0.009991884231567383, -0.00922250747680664, -0.008453130722045898, -0.007683753967285156, -0.006914377212524414, -0.006145000457763672, -0.00537562370300293, -0.0046062469482421875, -0.0038368701934814453, -0.003067493438720703, -0.002298116683959961, -0.0015287399291992188, -0.0007593631744384766, 1.0013580322265625e-05, 0.0007793903350830078, 0.00154876708984375, 0.002318143844604492, 0.0030875205993652344, 0.0038568973541259766, 0.004626274108886719, 0.005395650863647461, 0.006165027618408203, 0.006934404373168945, 0.0077037811279296875, 0.00847315788269043, 0.009242534637451172, 0.010011911392211914, 0.010781288146972656, 0.011550664901733398, 0.01232004165649414, 0.013089418411254883, 0.013858795166015625, 0.014628171920776367, 0.01539754867553711, 0.01616692543029785, 0.016936302185058594, 0.017705678939819336, 0.018475055694580078, 0.01924443244934082, 0.020013809204101562, 0.020783185958862305, 0.021552562713623047, 0.02232193946838379, 0.02309131622314453, 0.023860692977905273, 0.024630069732666016, 0.025399446487426758, 0.0261688232421875]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 995.0, 15.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04389767348766327, -0.04310816153883934, -0.04231865331530571, -0.04152914136648178, -0.04073963314294815, -0.03995012119412422, -0.03916060924530029, -0.03837110102176666, -0.037581589072942734, -0.036792077124118805, -0.036002568900585175, -0.035213056951761246, -0.03442354500293732, -0.033634036779403687, -0.03284452483057976, -0.03205501660704613, -0.0312655046582222, -0.03047599457204342, -0.02968648448586464, -0.02889697253704071, -0.02810746245086193, -0.02731795236468315, -0.026528440415859222, -0.025738930329680443, -0.024949420243501663, -0.024159910157322884, -0.023370400071144104, -0.022580888122320175, -0.021791378036141396, -0.021001867949962616, -0.020212356001138687, -0.019422845914959908, -0.018633335828781128, -0.01784382574260235, -0.01705431565642357, -0.01626480370759964, -0.01547529362142086, -0.01468578353524208, -0.013896272517740726, -0.013106761500239372, -0.012317251414060593, -0.011527741327881813, -0.010738230310380459, -0.009948719292879105, -0.009159209206700325, -0.008369699120521545, -0.007580188103020191, -0.006790677551180124, -0.00600116653367877, -0.005211655981838703, -0.004422145429998636, -0.0036326348781585693, -0.0028431243263185024, -0.0020536137744784355, -0.0012641032226383686, -0.0004745926707983017, 0.0003149178810417652, 0.0011044284328818321, 0.001893938984721899, 0.002683449536561966, 0.003472960088402033, 0.0042624706402421, 0.005051981192082167, 0.005841491743922234, 0.0066310022957623005]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 13.0, 7.0, 10.0, 14.0, 16.0, 30.0, 32.0, 31.0, 37.0, 46.0, 50.0, 51.0, 54.0, 52.0, 57.0, 47.0, 57.0, 49.0, 54.0, 52.0, 44.0, 27.0, 41.0, 25.0, 25.0, 26.0, 12.0, 11.0, 13.0, 9.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011968016624450684, -0.001146787777543068, -0.0010967738926410675, -0.001046760007739067, -0.0009967461228370667, -0.0009467322379350662, -0.0008967183530330658, -0.0008467044681310654, -0.0007966905832290649, -0.0007466766983270645, -0.0006966628134250641, -0.0006466489285230637, -0.0005966350436210632, -0.0005466211587190628, -0.0004966072738170624, -0.00044659338891506195, -0.0003965795040130615, -0.0003465656191110611, -0.00029655173420906067, -0.00024653784930706024, -0.00019652396440505981, -0.0001465100795030594, -9.649619460105896e-05, -4.648230969905853e-05, 3.5315752029418945e-06, 5.354546010494232e-05, 0.00010355934500694275, 0.00015357322990894318, 0.0002035871148109436, 0.00025360099971294403, 0.00030361488461494446, 0.0003536287695169449, 0.0004036426544189453, 0.00045365653932094574, 0.0005036704242229462, 0.0005536843091249466, 0.000603698194026947, 0.0006537120789289474, 0.0007037259638309479, 0.0007537398487329483, 0.0008037537336349487, 0.0008537676185369492, 0.0009037815034389496, 0.00095379538834095, 0.0010038092732429504, 0.0010538231581449509, 0.0011038370430469513, 0.0011538509279489517, 0.0012038648128509521, 0.0012538786977529526, 0.001303892582654953, 0.0013539064675569534, 0.0014039203524589539, 0.0014539342373609543, 0.0015039481222629547, 0.0015539620071649551, 0.0016039758920669556, 0.001653989776968956, 0.0017040036618709564, 0.0017540175467729568, 0.0018040314316749573, 0.0018540453165769577, 0.0019040592014789581, 0.0019540730863809586, 0.002004086971282959]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 1.0, 1.0, 2.0, 4.0, 7.0, 6.0, 5.0, 8.0, 10.0, 6.0, 7.0, 21.0, 14.0, 19.0, 24.0, 29.0, 22.0, 31.0, 31.0, 40.0, 38.0, 21.0, 39.0, 33.0, 44.0, 36.0, 37.0, 33.0, 35.0, 36.0, 46.0, 25.0, 33.0, 30.0, 36.0, 32.0, 20.0, 17.0, 16.0, 13.0, 19.0, 13.0, 17.0, 11.0, 13.0, 3.0, 5.0, 4.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.375, -10.0693359375, -9.763671875, -9.4580078125, -9.15234375, -8.8466796875, -8.541015625, -8.2353515625, -7.9296875, -7.6240234375, -7.318359375, -7.0126953125, -6.70703125, -6.4013671875, -6.095703125, -5.7900390625, -5.484375, -5.1787109375, -4.873046875, -4.5673828125, -4.26171875, -3.9560546875, -3.650390625, -3.3447265625, -3.0390625, -2.7333984375, -2.427734375, -2.1220703125, -1.81640625, -1.5107421875, -1.205078125, -0.8994140625, -0.59375, -0.2880859375, 0.017578125, 0.3232421875, 0.62890625, 0.9345703125, 1.240234375, 1.5458984375, 1.8515625, 2.1572265625, 2.462890625, 2.7685546875, 3.07421875, 3.3798828125, 3.685546875, 3.9912109375, 4.296875, 4.6025390625, 4.908203125, 5.2138671875, 5.51953125, 5.8251953125, 6.130859375, 6.4365234375, 6.7421875, 7.0478515625, 7.353515625, 7.6591796875, 7.96484375, 8.2705078125, 8.576171875, 8.8818359375, 9.1875]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 9.0, 6.0, 10.0, 19.0, 23.0, 26.0, 37.0, 54.0, 88.0, 94.0, 125.0, 196.0, 275.0, 353.0, 537.0, 721.0, 1021.0, 1511.0, 2156.0, 3350.0, 4873.0, 7661.0, 12315.0, 20738.0, 45198.0, 485957.0, 365725.0, 41618.0, 19696.0, 11756.0, 7414.0, 4731.0, 3174.0, 2113.0, 1478.0, 1012.0, 693.0, 507.0, 364.0, 256.0, 182.0, 133.0, 104.0, 69.0, 55.0, 28.0, 29.0, 19.0, 19.0, 13.0, 9.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-17.6875, -17.134033203125, -16.58056640625, -16.027099609375, -15.4736328125, -14.920166015625, -14.36669921875, -13.813232421875, -13.259765625, -12.706298828125, -12.15283203125, -11.599365234375, -11.0458984375, -10.492431640625, -9.93896484375, -9.385498046875, -8.83203125, -8.278564453125, -7.72509765625, -7.171630859375, -6.6181640625, -6.064697265625, -5.51123046875, -4.957763671875, -4.404296875, -3.850830078125, -3.29736328125, -2.743896484375, -2.1904296875, -1.636962890625, -1.08349609375, -0.530029296875, 0.0234375, 0.576904296875, 1.13037109375, 1.683837890625, 2.2373046875, 2.790771484375, 3.34423828125, 3.897705078125, 4.451171875, 5.004638671875, 5.55810546875, 6.111572265625, 6.6650390625, 7.218505859375, 7.77197265625, 8.325439453125, 8.87890625, 9.432373046875, 9.98583984375, 10.539306640625, 11.0927734375, 11.646240234375, 12.19970703125, 12.753173828125, 13.306640625, 13.860107421875, 14.41357421875, 14.967041015625, 15.5205078125, 16.073974609375, 16.62744140625, 17.180908203125, 17.734375]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 6.0, 4.0, 9.0, 7.0, 12.0, 12.0, 14.0, 17.0, 16.0, 20.0, 33.0, 17.0, 34.0, 35.0, 38.0, 52.0, 43.0, 79.0, 131.0, 1648.0, 281.0, 98.0, 72.0, 57.0, 51.0, 36.0, 28.0, 35.0, 27.0, 19.0, 20.0, 20.0, 6.0, 7.0, 14.0, 10.0, 10.0, 4.0, 6.0, 6.0, 2.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.15625, -35.01806640625, -33.8798828125, -32.74169921875, -31.603515625, -30.46533203125, -29.3271484375, -28.18896484375, -27.05078125, -25.91259765625, -24.7744140625, -23.63623046875, -22.498046875, -21.35986328125, -20.2216796875, -19.08349609375, -17.9453125, -16.80712890625, -15.6689453125, -14.53076171875, -13.392578125, -12.25439453125, -11.1162109375, -9.97802734375, -8.83984375, -7.70166015625, -6.5634765625, -5.42529296875, -4.287109375, -3.14892578125, -2.0107421875, -0.87255859375, 0.265625, 1.40380859375, 2.5419921875, 3.68017578125, 4.818359375, 5.95654296875, 7.0947265625, 8.23291015625, 9.37109375, 10.50927734375, 11.6474609375, 12.78564453125, 13.923828125, 15.06201171875, 16.2001953125, 17.33837890625, 18.4765625, 19.61474609375, 20.7529296875, 21.89111328125, 23.029296875, 24.16748046875, 25.3056640625, 26.44384765625, 27.58203125, 28.72021484375, 29.8583984375, 30.99658203125, 32.134765625, 33.27294921875, 34.4111328125, 35.54931640625, 36.6875]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 6.0, 5.0, 14.0, 19.0, 18.0, 35.0, 32.0, 37.0, 44.0, 68.0, 102.0, 123.0, 228.0, 481.0, 1618.0, 7972.0, 73557.0, 3010436.0, 42776.0, 5825.0, 1201.0, 376.0, 188.0, 127.0, 82.0, 71.0, 46.0, 47.0, 32.0, 31.0, 21.0, 21.0, 13.0, 14.0, 3.0, 8.0, 4.0, 7.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-75.125, -72.654296875, -70.18359375, -67.712890625, -65.2421875, -62.771484375, -60.30078125, -57.830078125, -55.359375, -52.888671875, -50.41796875, -47.947265625, -45.4765625, -43.005859375, -40.53515625, -38.064453125, -35.59375, -33.123046875, -30.65234375, -28.181640625, -25.7109375, -23.240234375, -20.76953125, -18.298828125, -15.828125, -13.357421875, -10.88671875, -8.416015625, -5.9453125, -3.474609375, -1.00390625, 1.466796875, 3.9375, 6.408203125, 8.87890625, 11.349609375, 13.8203125, 16.291015625, 18.76171875, 21.232421875, 23.703125, 26.173828125, 28.64453125, 31.115234375, 33.5859375, 36.056640625, 38.52734375, 40.998046875, 43.46875, 45.939453125, 48.41015625, 50.880859375, 53.3515625, 55.822265625, 58.29296875, 60.763671875, 63.234375, 65.705078125, 68.17578125, 70.646484375, 73.1171875, 75.587890625, 78.05859375, 80.529296875, 83.0]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 14.0, 57.0, 115.0, 327.0, 268.0, 162.0, 52.0, 13.0, 9.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-288.46795654296875, -282.6966857910156, -276.9254455566406, -271.1541748046875, -265.3829345703125, -259.6116638183594, -253.84042358398438, -248.0691680908203, -242.29791259765625, -236.5266571044922, -230.75540161132812, -224.98414611816406, -219.212890625, -213.44163513183594, -207.67037963867188, -201.8991241455078, -196.12786865234375, -190.3566131591797, -184.58535766601562, -178.81410217285156, -173.0428466796875, -167.27159118652344, -161.50033569335938, -155.7290802001953, -149.9578094482422, -144.18655395507812, -138.41529846191406, -132.64404296875, -126.87278747558594, -121.10153198242188, -115.33027648925781, -109.55902099609375, -103.78777313232422, -98.01651763916016, -92.2452621459961, -86.47400665283203, -80.70275115966797, -74.9314956665039, -69.16023254394531, -63.388980865478516, -57.61772537231445, -51.84646987915039, -46.07521438598633, -40.303955078125, -34.53269958496094, -28.761445999145508, -22.990188598632812, -17.21893310546875, -11.447677612304688, -5.676421642303467, 0.0948343276977539, 5.866090774536133, 11.637346267700195, 17.408601760864258, 23.179859161376953, 28.951114654541016, 34.72237014770508, 40.49362564086914, 46.2648811340332, 52.03614044189453, 57.807395935058594, 63.578651428222656, 69.34990692138672, 75.12116241455078, 80.89241790771484]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 5.0, 5.0, 3.0, 10.0, 5.0, 11.0, 15.0, 17.0, 17.0, 18.0, 22.0, 15.0, 19.0, 25.0, 21.0, 28.0, 36.0, 29.0, 43.0, 29.0, 38.0, 39.0, 43.0, 41.0, 44.0, 36.0, 34.0, 39.0, 43.0, 39.0, 32.0, 29.0, 19.0, 21.0, 24.0, 13.0, 20.0, 17.0, 12.0, 13.0, 8.0, 6.0, 6.0, 3.0, 3.0, 5.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-83.98104095458984, -81.23321533203125, -78.48538970947266, -75.7375717163086, -72.98974609375, -70.2419204711914, -67.49409484863281, -64.74627685546875, -61.998451232910156, -59.25062561035156, -56.502803802490234, -53.75497817993164, -51.00715637207031, -48.25933074951172, -45.511505126953125, -42.7636833190918, -40.0158576965332, -37.26803207397461, -34.52021026611328, -31.772384643554688, -29.02456283569336, -26.276737213134766, -23.528913497924805, -20.781089782714844, -18.033266067504883, -15.285442352294922, -12.537618637084961, -9.789793968200684, -7.041970252990723, -4.294146537780762, -1.5463218688964844, 1.2015018463134766, 3.9493255615234375, 6.697149276733398, 9.44497299194336, 12.192797660827637, 14.940621376037598, 17.688446044921875, 20.436269760131836, 23.184093475341797, 25.931917190551758, 28.67974090576172, 31.42756462097168, 34.17538833618164, 36.923213958740234, 39.67103576660156, 42.418861389160156, 45.16668701171875, 47.91450881958008, 50.66233444213867, 53.41015625, 56.157981872558594, 58.90580368041992, 61.653629302978516, 64.40145111083984, 67.14927673339844, 69.89710235595703, 72.64492797851562, 75.39275360107422, 78.14057159423828, 80.88839721679688, 83.63622283935547, 86.38404846191406, 89.13186645507812, 91.87969207763672]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 8.0, 6.0, 8.0, 7.0, 3.0, 8.0, 15.0, 18.0, 20.0, 28.0, 29.0, 32.0, 30.0, 38.0, 30.0, 49.0, 36.0, 38.0, 38.0, 46.0, 49.0, 34.0, 35.0, 39.0, 29.0, 45.0, 35.0, 34.0, 27.0, 38.0, 19.0, 17.0, 20.0, 16.0, 18.0, 14.0, 10.0, 6.0, 6.0, 6.0, 3.0, 6.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.4453125, -12.0806884765625, -11.716064453125, -11.3514404296875, -10.98681640625, -10.6221923828125, -10.257568359375, -9.8929443359375, -9.5283203125, -9.1636962890625, -8.799072265625, -8.4344482421875, -8.06982421875, -7.7052001953125, -7.340576171875, -6.9759521484375, -6.611328125, -6.2467041015625, -5.882080078125, -5.5174560546875, -5.15283203125, -4.7882080078125, -4.423583984375, -4.0589599609375, -3.6943359375, -3.3297119140625, -2.965087890625, -2.6004638671875, -2.23583984375, -1.8712158203125, -1.506591796875, -1.1419677734375, -0.77734375, -0.4127197265625, -0.048095703125, 0.3165283203125, 0.68115234375, 1.0457763671875, 1.410400390625, 1.7750244140625, 2.1396484375, 2.5042724609375, 2.868896484375, 3.2335205078125, 3.59814453125, 3.9627685546875, 4.327392578125, 4.6920166015625, 5.056640625, 5.4212646484375, 5.785888671875, 6.1505126953125, 6.51513671875, 6.8797607421875, 7.244384765625, 7.6090087890625, 7.9736328125, 8.3382568359375, 8.702880859375, 9.0675048828125, 9.43212890625, 9.7967529296875, 10.161376953125, 10.5260009765625, 10.890625]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 4.0, 9.0, 5.0, 6.0, 10.0, 17.0, 27.0, 18.0, 34.0, 32.0, 45.0, 59.0, 83.0, 85.0, 144.0, 222.0, 382.0, 672.0, 1366.0, 3198.0, 8733.0, 31378.0, 570900.0, 3307796.0, 235309.0, 22153.0, 6558.0, 2448.0, 1068.0, 529.0, 273.0, 177.0, 118.0, 106.0, 67.0, 54.0, 53.0, 43.0, 20.0, 17.0, 15.0, 12.0, 17.0, 6.0, 2.0, 7.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-37.53125, -36.40673828125, -35.2822265625, -34.15771484375, -33.033203125, -31.90869140625, -30.7841796875, -29.65966796875, -28.53515625, -27.41064453125, -26.2861328125, -25.16162109375, -24.037109375, -22.91259765625, -21.7880859375, -20.66357421875, -19.5390625, -18.41455078125, -17.2900390625, -16.16552734375, -15.041015625, -13.91650390625, -12.7919921875, -11.66748046875, -10.54296875, -9.41845703125, -8.2939453125, -7.16943359375, -6.044921875, -4.92041015625, -3.7958984375, -2.67138671875, -1.546875, -0.42236328125, 0.7021484375, 1.82666015625, 2.951171875, 4.07568359375, 5.2001953125, 6.32470703125, 7.44921875, 8.57373046875, 9.6982421875, 10.82275390625, 11.947265625, 13.07177734375, 14.1962890625, 15.32080078125, 16.4453125, 17.56982421875, 18.6943359375, 19.81884765625, 20.943359375, 22.06787109375, 23.1923828125, 24.31689453125, 25.44140625, 26.56591796875, 27.6904296875, 28.81494140625, 29.939453125, 31.06396484375, 32.1884765625, 33.31298828125, 34.4375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 6.0, 12.0, 12.0, 18.0, 20.0, 24.0, 32.0, 44.0, 55.0, 80.0, 129.0, 254.0, 441.0, 778.0, 852.0, 567.0, 304.0, 137.0, 89.0, 56.0, 44.0, 30.0, 26.0, 17.0, 12.0, 7.0, 4.0, 5.0, 3.0, 4.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.734375, -27.8125, -26.890625, -25.96875, -25.046875, -24.125, -23.203125, -22.28125, -21.359375, -20.4375, -19.515625, -18.59375, -17.671875, -16.75, -15.828125, -14.90625, -13.984375, -13.0625, -12.140625, -11.21875, -10.296875, -9.375, -8.453125, -7.53125, -6.609375, -5.6875, -4.765625, -3.84375, -2.921875, -2.0, -1.078125, -0.15625, 0.765625, 1.6875, 2.609375, 3.53125, 4.453125, 5.375, 6.296875, 7.21875, 8.140625, 9.0625, 9.984375, 10.90625, 11.828125, 12.75, 13.671875, 14.59375, 15.515625, 16.4375, 17.359375, 18.28125, 19.203125, 20.125, 21.046875, 21.96875, 22.890625, 23.8125, 24.734375, 25.65625, 26.578125, 27.5, 28.421875, 29.34375, 30.265625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 6.0, 4.0, 6.0, 4.0, 11.0, 24.0, 29.0, 46.0, 68.0, 123.0, 218.0, 700.0, 3311.0, 41140.0, 3933711.0, 205214.0, 7665.0, 1170.0, 338.0, 181.0, 105.0, 47.0, 46.0, 29.0, 18.0, 15.0, 17.0, 8.0, 10.0, 5.0, 2.0, 2.0, 2.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-105.0, -101.7890625, -98.578125, -95.3671875, -92.15625, -88.9453125, -85.734375, -82.5234375, -79.3125, -76.1015625, -72.890625, -69.6796875, -66.46875, -63.2578125, -60.046875, -56.8359375, -53.625, -50.4140625, -47.203125, -43.9921875, -40.78125, -37.5703125, -34.359375, -31.1484375, -27.9375, -24.7265625, -21.515625, -18.3046875, -15.09375, -11.8828125, -8.671875, -5.4609375, -2.25, 0.9609375, 4.171875, 7.3828125, 10.59375, 13.8046875, 17.015625, 20.2265625, 23.4375, 26.6484375, 29.859375, 33.0703125, 36.28125, 39.4921875, 42.703125, 45.9140625, 49.125, 52.3359375, 55.546875, 58.7578125, 61.96875, 65.1796875, 68.390625, 71.6015625, 74.8125, 78.0234375, 81.234375, 84.4453125, 87.65625, 90.8671875, 94.078125, 97.2890625, 100.5]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 4.0, 4.0, 21.0, 37.0, 85.0, 142.0, 232.0, 217.0, 135.0, 70.0, 33.0, 18.0, 9.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-113.5796890258789, -107.28607940673828, -100.99246215820312, -94.6988525390625, -88.40523529052734, -82.11162567138672, -75.81800842285156, -69.52439880371094, -63.23078536987305, -56.937171936035156, -50.643558502197266, -44.349945068359375, -38.05633544921875, -31.762720108032227, -25.46910858154297, -19.175495147705078, -12.881881713867188, -6.588268756866455, -0.29465579986572266, 5.998956680297852, 12.292570114135742, 18.586183547973633, 24.87979507446289, 31.17340850830078, 37.46702194213867, 43.76063537597656, 50.05424880981445, 56.347862243652344, 62.64147186279297, 68.93508911132812, 75.22869873046875, 81.52230834960938, 87.81593322753906, 94.10954284667969, 100.40316009521484, 106.69676971435547, 112.99038696289062, 119.28399658203125, 125.57760620117188, 131.8712158203125, 138.1648406982422, 144.4584503173828, 150.75205993652344, 157.04568481445312, 163.33929443359375, 169.63290405273438, 175.926513671875, 182.22012329101562, 188.51373291015625, 194.80734252929688, 201.1009521484375, 207.3945770263672, 213.6881866455078, 219.98179626464844, 226.27540588378906, 232.56903076171875, 238.86264038085938, 245.15625, 251.44985961914062, 257.74346923828125, 264.0370788574219, 270.3307189941406, 276.62432861328125, 282.9179382324219, 289.2115478515625]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 8.0, 9.0, 12.0, 14.0, 11.0, 14.0, 23.0, 17.0, 19.0, 16.0, 30.0, 24.0, 38.0, 33.0, 32.0, 41.0, 36.0, 40.0, 36.0, 39.0, 39.0, 49.0, 27.0, 36.0, 45.0, 29.0, 34.0, 29.0, 24.0, 22.0, 29.0, 24.0, 27.0, 13.0, 14.0, 8.0, 12.0, 8.0, 8.0, 8.0, 7.0, 8.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-65.63673400878906, -63.30698776245117, -60.97724533081055, -58.647499084472656, -56.31775665283203, -53.98801040649414, -51.65826416015625, -49.328521728515625, -46.998775482177734, -44.669029235839844, -42.33928680419922, -40.00954055786133, -37.67979431152344, -35.35005187988281, -33.02030563354492, -30.690561294555664, -28.360816955566406, -26.03107261657715, -23.70132827758789, -21.37158203125, -19.041837692260742, -16.712093353271484, -14.38234806060791, -12.052602767944336, -9.722858428955078, -7.393113613128662, -5.063368797302246, -2.73362398147583, -0.40387916564941406, 1.9258651733398438, 4.255610466003418, 6.585355758666992, 8.91510009765625, 11.244844436645508, 13.574589729309082, 15.904335021972656, 18.234079360961914, 20.563823699951172, 22.893569946289062, 25.22331428527832, 27.553058624267578, 29.882802963256836, 32.212547302246094, 34.542293548583984, 36.872039794921875, 39.2017822265625, 41.53152847290039, 43.86127471923828, 46.191017150878906, 48.5207633972168, 50.85050582885742, 53.18025207519531, 55.50999450683594, 57.83974075317383, 60.16948699951172, 62.499229431152344, 64.8289794921875, 67.15872192382812, 69.48847198486328, 71.8182144165039, 74.14795684814453, 76.47770690917969, 78.80744934082031, 81.13719177246094, 83.46693420410156]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 0.0, 1.0, 3.0, 2.0, 7.0, 7.0, 5.0, 11.0, 12.0, 10.0, 15.0, 15.0, 21.0, 23.0, 28.0, 25.0, 36.0, 36.0, 36.0, 34.0, 35.0, 32.0, 50.0, 50.0, 36.0, 46.0, 33.0, 40.0, 24.0, 31.0, 44.0, 29.0, 27.0, 34.0, 17.0, 24.0, 24.0, 13.0, 14.0, 10.0, 11.0, 11.0, 10.0, 4.0, 6.0, 7.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0], "bins": [-11.90625, -11.570068359375, -11.23388671875, -10.897705078125, -10.5615234375, -10.225341796875, -9.88916015625, -9.552978515625, -9.216796875, -8.880615234375, -8.54443359375, -8.208251953125, -7.8720703125, -7.535888671875, -7.19970703125, -6.863525390625, -6.52734375, -6.191162109375, -5.85498046875, -5.518798828125, -5.1826171875, -4.846435546875, -4.51025390625, -4.174072265625, -3.837890625, -3.501708984375, -3.16552734375, -2.829345703125, -2.4931640625, -2.156982421875, -1.82080078125, -1.484619140625, -1.1484375, -0.812255859375, -0.47607421875, -0.139892578125, 0.1962890625, 0.532470703125, 0.86865234375, 1.204833984375, 1.541015625, 1.877197265625, 2.21337890625, 2.549560546875, 2.8857421875, 3.221923828125, 3.55810546875, 3.894287109375, 4.23046875, 4.566650390625, 4.90283203125, 5.239013671875, 5.5751953125, 5.911376953125, 6.24755859375, 6.583740234375, 6.919921875, 7.256103515625, 7.59228515625, 7.928466796875, 8.2646484375, 8.600830078125, 8.93701171875, 9.273193359375, 9.609375]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 8.0, 6.0, 15.0, 13.0, 16.0, 36.0, 43.0, 84.0, 125.0, 181.0, 316.0, 498.0, 824.0, 1199.0, 2013.0, 3313.0, 5221.0, 8644.0, 14412.0, 24489.0, 42307.0, 73871.0, 133143.0, 238699.0, 217301.0, 119529.0, 67412.0, 38504.0, 22531.0, 13167.0, 8006.0, 4710.0, 2983.0, 1874.0, 1120.0, 724.0, 440.0, 295.0, 174.0, 114.0, 73.0, 44.0, 31.0, 28.0, 7.0, 12.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.32666015625, -0.3170280456542969, -0.30739593505859375, -0.2977638244628906, -0.2881317138671875, -0.2784996032714844, -0.26886749267578125, -0.2592353820800781, -0.249603271484375, -0.23997116088867188, -0.23033905029296875, -0.22070693969726562, -0.2110748291015625, -0.20144271850585938, -0.19181060791015625, -0.18217849731445312, -0.17254638671875, -0.16291427612304688, -0.15328216552734375, -0.14365005493164062, -0.1340179443359375, -0.12438583374023438, -0.11475372314453125, -0.10512161254882812, -0.095489501953125, -0.08585739135742188, -0.07622528076171875, -0.06659317016601562, -0.0569610595703125, -0.047328948974609375, -0.03769683837890625, -0.028064727783203125, -0.0184326171875, -0.008800506591796875, 0.00083160400390625, 0.010463714599609375, 0.0200958251953125, 0.029727935791015625, 0.03936004638671875, 0.048992156982421875, 0.058624267578125, 0.06825637817382812, 0.07788848876953125, 0.08752059936523438, 0.0971527099609375, 0.10678482055664062, 0.11641693115234375, 0.12604904174804688, 0.13568115234375, 0.14531326293945312, 0.15494537353515625, 0.16457748413085938, 0.1742095947265625, 0.18384170532226562, 0.19347381591796875, 0.20310592651367188, 0.212738037109375, 0.22237014770507812, 0.23200225830078125, 0.24163436889648438, 0.2512664794921875, 0.2608985900878906, 0.27053070068359375, 0.2801628112792969, 0.289794921875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 6.0, 5.0, 6.0, 10.0, 13.0, 11.0, 14.0, 17.0, 27.0, 21.0, 30.0, 25.0, 37.0, 38.0, 37.0, 32.0, 31.0, 39.0, 32.0, 51.0, 1067.0, 39.0, 47.0, 36.0, 42.0, 36.0, 39.0, 28.0, 31.0, 31.0, 24.0, 16.0, 26.0, 12.0, 12.0, 15.0, 9.0, 9.0, 5.0, 4.0, 6.0, 9.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.75, -9.458984375, -9.16796875, -8.876953125, -8.5859375, -8.294921875, -8.00390625, -7.712890625, -7.421875, -7.130859375, -6.83984375, -6.548828125, -6.2578125, -5.966796875, -5.67578125, -5.384765625, -5.09375, -4.802734375, -4.51171875, -4.220703125, -3.9296875, -3.638671875, -3.34765625, -3.056640625, -2.765625, -2.474609375, -2.18359375, -1.892578125, -1.6015625, -1.310546875, -1.01953125, -0.728515625, -0.4375, -0.146484375, 0.14453125, 0.435546875, 0.7265625, 1.017578125, 1.30859375, 1.599609375, 1.890625, 2.181640625, 2.47265625, 2.763671875, 3.0546875, 3.345703125, 3.63671875, 3.927734375, 4.21875, 4.509765625, 4.80078125, 5.091796875, 5.3828125, 5.673828125, 5.96484375, 6.255859375, 6.546875, 6.837890625, 7.12890625, 7.419921875, 7.7109375, 8.001953125, 8.29296875, 8.583984375, 8.875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [5.0, 5.0, 2.0, 4.0, 3.0, 7.0, 14.0, 14.0, 12.0, 16.0, 39.0, 59.0, 61.0, 113.0, 156.0, 228.0, 322.0, 471.0, 650.0, 899.0, 1292.0, 1877.0, 2677.0, 3955.0, 5607.0, 8550.0, 13106.0, 19830.0, 30262.0, 46790.0, 72628.0, 116999.0, 311714.0, 1123449.0, 119730.0, 75081.0, 47820.0, 31141.0, 20526.0, 13401.0, 8696.0, 5947.0, 3919.0, 2728.0, 1902.0, 1266.0, 909.0, 671.0, 440.0, 350.0, 252.0, 169.0, 112.0, 85.0, 63.0, 49.0, 29.0, 20.0, 13.0, 4.0, 5.0, 3.0, 0.0, 5.0], "bins": [-0.1302490234375, -0.12630558013916016, -0.12236213684082031, -0.11841869354248047, -0.11447525024414062, -0.11053180694580078, -0.10658836364746094, -0.1026449203491211, -0.09870147705078125, -0.0947580337524414, -0.09081459045410156, -0.08687114715576172, -0.08292770385742188, -0.07898426055908203, -0.07504081726074219, -0.07109737396240234, -0.0671539306640625, -0.06321048736572266, -0.05926704406738281, -0.05532360076904297, -0.051380157470703125, -0.04743671417236328, -0.04349327087402344, -0.039549827575683594, -0.03560638427734375, -0.031662940979003906, -0.027719497680664062, -0.02377605438232422, -0.019832611083984375, -0.01588916778564453, -0.011945724487304688, -0.008002281188964844, -0.004058837890625, -0.00011539459228515625, 0.0038280487060546875, 0.007771492004394531, 0.011714935302734375, 0.01565837860107422, 0.019601821899414062, 0.023545265197753906, 0.02748870849609375, 0.031432151794433594, 0.03537559509277344, 0.03931903839111328, 0.043262481689453125, 0.04720592498779297, 0.05114936828613281, 0.055092811584472656, 0.0590362548828125, 0.06297969818115234, 0.06692314147949219, 0.07086658477783203, 0.07481002807617188, 0.07875347137451172, 0.08269691467285156, 0.0866403579711914, 0.09058380126953125, 0.0945272445678711, 0.09847068786621094, 0.10241413116455078, 0.10635757446289062, 0.11030101776123047, 0.11424446105957031, 0.11818790435791016, 0.12213134765625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 8.0, 7.0, 3.0, 1.0, 6.0, 9.0, 13.0, 12.0, 9.0, 16.0, 17.0, 17.0, 20.0, 15.0, 37.0, 30.0, 34.0, 36.0, 49.0, 41.0, 43.0, 62.0, 59.0, 51.0, 44.0, 52.0, 42.0, 43.0, 28.0, 33.0, 30.0, 27.0, 13.0, 16.0, 13.0, 16.0, 8.0, 13.0, 6.0, 7.0, 7.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.0009794235229492188, -0.0009486228227615356, -0.0009178221225738525, -0.0008870214223861694, -0.0008562207221984863, -0.0008254200220108032, -0.0007946193218231201, -0.000763818621635437, -0.0007330179214477539, -0.0007022172212600708, -0.0006714165210723877, -0.0006406158208847046, -0.0006098151206970215, -0.0005790144205093384, -0.0005482137203216553, -0.0005174130201339722, -0.00048661231994628906, -0.00045581161975860596, -0.00042501091957092285, -0.00039421021938323975, -0.00036340951919555664, -0.00033260881900787354, -0.00030180811882019043, -0.0002710074186325073, -0.00024020671844482422, -0.0002094060182571411, -0.000178605318069458, -0.0001478046178817749, -0.0001170039176940918, -8.620321750640869e-05, -5.5402517318725586e-05, -2.460181713104248e-05, 6.198883056640625e-06, 3.699958324432373e-05, 6.780028343200684e-05, 9.860098361968994e-05, 0.00012940168380737305, 0.00016020238399505615, 0.00019100308418273926, 0.00022180378437042236, 0.00025260448455810547, 0.0002834051847457886, 0.0003142058849334717, 0.0003450065851211548, 0.0003758072853088379, 0.000406607985496521, 0.0004374086856842041, 0.0004682093858718872, 0.0004990100860595703, 0.0005298107862472534, 0.0005606114864349365, 0.0005914121866226196, 0.0006222128868103027, 0.0006530135869979858, 0.0006838142871856689, 0.000714614987373352, 0.0007454156875610352, 0.0007762163877487183, 0.0008070170879364014, 0.0008378177881240845, 0.0008686184883117676, 0.0008994191884994507, 0.0009302198886871338, 0.0009610205888748169, 0.0009918212890625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 10.0, 7.0, 7.0, 11.0, 8.0, 17.0, 12.0, 15.0, 16.0, 28.0, 35.0, 35.0, 44.0, 89.0, 180.0, 401.0, 1119.0, 55831.0, 986733.0, 2675.0, 581.0, 232.0, 115.0, 68.0, 53.0, 33.0, 35.0, 18.0, 19.0, 18.0, 20.0, 14.0, 9.0, 11.0, 14.0, 8.0, 6.0, 2.0, 3.0, 6.0, 9.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0220184326171875, -0.02133488655090332, -0.02065134048461914, -0.01996779441833496, -0.01928424835205078, -0.0186007022857666, -0.017917156219482422, -0.017233610153198242, -0.016550064086914062, -0.015866518020629883, -0.015182971954345703, -0.014499425888061523, -0.013815879821777344, -0.013132333755493164, -0.012448787689208984, -0.011765241622924805, -0.011081695556640625, -0.010398149490356445, -0.009714603424072266, -0.009031057357788086, -0.008347511291503906, -0.0076639652252197266, -0.006980419158935547, -0.006296873092651367, -0.0056133270263671875, -0.004929780960083008, -0.004246234893798828, -0.0035626888275146484, -0.0028791427612304688, -0.002195596694946289, -0.0015120506286621094, -0.0008285045623779297, -0.00014495849609375, 0.0005385875701904297, 0.0012221336364746094, 0.001905679702758789, 0.0025892257690429688, 0.0032727718353271484, 0.003956317901611328, 0.004639863967895508, 0.0053234100341796875, 0.006006956100463867, 0.006690502166748047, 0.0073740482330322266, 0.008057594299316406, 0.008741140365600586, 0.009424686431884766, 0.010108232498168945, 0.010791778564453125, 0.011475324630737305, 0.012158870697021484, 0.012842416763305664, 0.013525962829589844, 0.014209508895874023, 0.014893054962158203, 0.015576601028442383, 0.016260147094726562, 0.016943693161010742, 0.017627239227294922, 0.0183107852935791, 0.01899433135986328, 0.01967787742614746, 0.02036142349243164, 0.02104496955871582, 0.021728515625]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 397.0, 613.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.022900115698575974, -0.022442439571022987, -0.02198476344347, -0.021527087315917015, -0.02106941118836403, -0.020611733198165894, -0.020154058933258057, -0.01969638094305992, -0.019238704815506935, -0.01878102868795395, -0.018323352560400963, -0.017865676432847977, -0.01740800030529499, -0.016950324177742004, -0.01649264618754387, -0.016034970059990883, -0.015577294863760471, -0.015119618736207485, -0.014661942608654499, -0.014204265549778938, -0.013746589422225952, -0.013288913294672966, -0.01283123716711998, -0.012373561039566994, -0.011915884912014008, -0.011458208784461021, -0.011000532656908035, -0.01054285652935505, -0.010085179470479488, -0.009627503342926502, -0.009169827215373516, -0.00871215108782053, -0.008254473097622395, -0.007796796970069408, -0.007339120376855135, -0.006881444249302149, -0.006423767656087875, -0.005966091528534889, -0.005508415400981903, -0.005050739273428917, -0.0045930626802146435, -0.004135386552661657, -0.003677709959447384, -0.0032200338318943977, -0.002762357471510768, -0.002304681111127138, -0.001847004983574152, -0.0013893286231905222, -0.0009316522628068924, -0.0004739759606309235, -1.6299658454954624e-05, 0.00044137658551335335, 0.0008990529458969831, 0.001356729306280613, 0.001814405433833599, 0.002272081794217229, 0.0027297581546008587, 0.0031874345149844885, 0.0036451108753681183, 0.004102787002921104, 0.004560463130474091, 0.005018139723688364, 0.00547581585124135, 0.005933492444455624, 0.00639116857200861]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 8.0, 4.0, 6.0, 9.0, 12.0, 16.0, 13.0, 24.0, 25.0, 34.0, 29.0, 31.0, 35.0, 40.0, 49.0, 55.0, 52.0, 48.0, 44.0, 56.0, 47.0, 43.0, 33.0, 49.0, 43.0, 35.0, 31.0, 28.0, 19.0, 14.0, 15.0, 14.0, 12.0, 8.0, 9.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010987520217895508, -0.0010580597445368767, -0.0010173674672842026, -0.0009766751900315285, -0.0009359829127788544, -0.0008952906355261803, -0.0008545983582735062, -0.0008139060810208321, -0.000773213803768158, -0.0007325215265154839, -0.0006918292492628098, -0.0006511369720101357, -0.0006104446947574615, -0.0005697524175047874, -0.0005290601402521133, -0.0004883678629994392, -0.00044767558574676514, -0.00040698330849409103, -0.00036629103124141693, -0.00032559875398874283, -0.0002849064767360687, -0.0002442141994833946, -0.00020352192223072052, -0.00016282964497804642, -0.00012213736772537231, -8.144509047269821e-05, -4.075281322002411e-05, -6.05359673500061e-08, 4.06317412853241e-05, 8.13240185379982e-05, 0.0001220162957906723, 0.0001627085730433464, 0.0002034008502960205, 0.0002440931275486946, 0.0002847854048013687, 0.0003254776820540428, 0.0003661699593067169, 0.000406862236559391, 0.0004475545138120651, 0.00048824679106473923, 0.0005289390683174133, 0.0005696313455700874, 0.0006103236228227615, 0.0006510159000754356, 0.0006917081773281097, 0.0007324004545807838, 0.000773092731833458, 0.000813785009086132, 0.0008544772863388062, 0.0008951695635914803, 0.0009358618408441544, 0.0009765541180968285, 0.0010172463953495026, 0.0010579386726021767, 0.0010986309498548508, 0.0011393232271075249, 0.001180015504360199, 0.001220707781612873, 0.0012614000588655472, 0.0013020923361182213, 0.0013427846133708954, 0.0013834768906235695, 0.0014241691678762436, 0.0014648614451289177, 0.0015055537223815918]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 0.0, 1.0, 3.0, 2.0, 7.0, 7.0, 5.0, 11.0, 12.0, 10.0, 15.0, 15.0, 21.0, 23.0, 28.0, 25.0, 36.0, 36.0, 36.0, 34.0, 35.0, 32.0, 50.0, 50.0, 36.0, 46.0, 33.0, 40.0, 24.0, 31.0, 44.0, 29.0, 27.0, 34.0, 17.0, 24.0, 24.0, 13.0, 14.0, 10.0, 11.0, 11.0, 10.0, 4.0, 6.0, 7.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0], "bins": [-11.90625, -11.570068359375, -11.23388671875, -10.897705078125, -10.5615234375, -10.225341796875, -9.88916015625, -9.552978515625, -9.216796875, -8.880615234375, -8.54443359375, -8.208251953125, -7.8720703125, -7.535888671875, -7.19970703125, -6.863525390625, -6.52734375, -6.191162109375, -5.85498046875, -5.518798828125, -5.1826171875, -4.846435546875, -4.51025390625, -4.174072265625, -3.837890625, -3.501708984375, -3.16552734375, -2.829345703125, -2.4931640625, -2.156982421875, -1.82080078125, -1.484619140625, -1.1484375, -0.812255859375, -0.47607421875, -0.139892578125, 0.1962890625, 0.532470703125, 0.86865234375, 1.204833984375, 1.541015625, 1.877197265625, 2.21337890625, 2.549560546875, 2.8857421875, 3.221923828125, 3.55810546875, 3.894287109375, 4.23046875, 4.566650390625, 4.90283203125, 5.239013671875, 5.5751953125, 5.911376953125, 6.24755859375, 6.583740234375, 6.919921875, 7.256103515625, 7.59228515625, 7.928466796875, 8.2646484375, 8.600830078125, 8.93701171875, 9.273193359375, 9.609375]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 5.0, 7.0, 11.0, 11.0, 17.0, 22.0, 31.0, 37.0, 67.0, 80.0, 126.0, 149.0, 221.0, 327.0, 492.0, 777.0, 1082.0, 1694.0, 2586.0, 4183.0, 7570.0, 15172.0, 48859.0, 613288.0, 289859.0, 32559.0, 12322.0, 6343.0, 3751.0, 2301.0, 1478.0, 991.0, 644.0, 457.0, 302.0, 218.0, 176.0, 94.0, 64.0, 64.0, 32.0, 26.0, 10.0, 21.0, 8.0, 12.0, 3.0, 3.0, 0.0, 4.0, 3.0, 3.0, 0.0, 1.0], "bins": [-17.015625, -16.51318359375, -16.0107421875, -15.50830078125, -15.005859375, -14.50341796875, -14.0009765625, -13.49853515625, -12.99609375, -12.49365234375, -11.9912109375, -11.48876953125, -10.986328125, -10.48388671875, -9.9814453125, -9.47900390625, -8.9765625, -8.47412109375, -7.9716796875, -7.46923828125, -6.966796875, -6.46435546875, -5.9619140625, -5.45947265625, -4.95703125, -4.45458984375, -3.9521484375, -3.44970703125, -2.947265625, -2.44482421875, -1.9423828125, -1.43994140625, -0.9375, -0.43505859375, 0.0673828125, 0.56982421875, 1.072265625, 1.57470703125, 2.0771484375, 2.57958984375, 3.08203125, 3.58447265625, 4.0869140625, 4.58935546875, 5.091796875, 5.59423828125, 6.0966796875, 6.59912109375, 7.1015625, 7.60400390625, 8.1064453125, 8.60888671875, 9.111328125, 9.61376953125, 10.1162109375, 10.61865234375, 11.12109375, 11.62353515625, 12.1259765625, 12.62841796875, 13.130859375, 13.63330078125, 14.1357421875, 14.63818359375, 15.140625]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 10.0, 9.0, 11.0, 9.0, 13.0, 10.0, 15.0, 18.0, 17.0, 26.0, 30.0, 32.0, 46.0, 53.0, 33.0, 46.0, 58.0, 80.0, 378.0, 1619.0, 92.0, 65.0, 55.0, 44.0, 38.0, 29.0, 41.0, 25.0, 34.0, 18.0, 18.0, 13.0, 17.0, 8.0, 6.0, 11.0, 5.0, 3.0, 6.0, 9.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.6875, -34.41650390625, -33.1455078125, -31.87451171875, -30.603515625, -29.33251953125, -28.0615234375, -26.79052734375, -25.51953125, -24.24853515625, -22.9775390625, -21.70654296875, -20.435546875, -19.16455078125, -17.8935546875, -16.62255859375, -15.3515625, -14.08056640625, -12.8095703125, -11.53857421875, -10.267578125, -8.99658203125, -7.7255859375, -6.45458984375, -5.18359375, -3.91259765625, -2.6416015625, -1.37060546875, -0.099609375, 1.17138671875, 2.4423828125, 3.71337890625, 4.984375, 6.25537109375, 7.5263671875, 8.79736328125, 10.068359375, 11.33935546875, 12.6103515625, 13.88134765625, 15.15234375, 16.42333984375, 17.6943359375, 18.96533203125, 20.236328125, 21.50732421875, 22.7783203125, 24.04931640625, 25.3203125, 26.59130859375, 27.8623046875, 29.13330078125, 30.404296875, 31.67529296875, 32.9462890625, 34.21728515625, 35.48828125, 36.75927734375, 38.0302734375, 39.30126953125, 40.572265625, 41.84326171875, 43.1142578125, 44.38525390625, 45.65625]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 10.0, 7.0, 7.0, 11.0, 12.0, 8.0, 12.0, 19.0, 27.0, 25.0, 40.0, 61.0, 75.0, 90.0, 101.0, 150.0, 266.0, 698.0, 2972.0, 23391.0, 2989555.0, 118163.0, 7421.0, 1394.0, 388.0, 205.0, 135.0, 109.0, 77.0, 66.0, 47.0, 39.0, 31.0, 20.0, 12.0, 12.0, 10.0, 13.0, 9.0, 11.0, 6.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-82.8125, -80.49609375, -78.1796875, -75.86328125, -73.546875, -71.23046875, -68.9140625, -66.59765625, -64.28125, -61.96484375, -59.6484375, -57.33203125, -55.015625, -52.69921875, -50.3828125, -48.06640625, -45.75, -43.43359375, -41.1171875, -38.80078125, -36.484375, -34.16796875, -31.8515625, -29.53515625, -27.21875, -24.90234375, -22.5859375, -20.26953125, -17.953125, -15.63671875, -13.3203125, -11.00390625, -8.6875, -6.37109375, -4.0546875, -1.73828125, 0.578125, 2.89453125, 5.2109375, 7.52734375, 9.84375, 12.16015625, 14.4765625, 16.79296875, 19.109375, 21.42578125, 23.7421875, 26.05859375, 28.375, 30.69140625, 33.0078125, 35.32421875, 37.640625, 39.95703125, 42.2734375, 44.58984375, 46.90625, 49.22265625, 51.5390625, 53.85546875, 56.171875, 58.48828125, 60.8046875, 63.12109375, 65.4375]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 28.0, 447.0, 512.0, 33.0], "bins": [-662.664794921875, -651.9754638671875, -641.2861938476562, -630.5968627929688, -619.9075927734375, -609.21826171875, -598.5289916992188, -587.8396606445312, -577.150390625, -566.4610595703125, -555.7717895507812, -545.0824584960938, -534.3931884765625, -523.703857421875, -513.0145874023438, -502.3252868652344, -491.635986328125, -480.9466857910156, -470.25738525390625, -459.5680847167969, -448.8787841796875, -438.1894836425781, -427.50018310546875, -416.8108825683594, -406.1215515136719, -395.4322509765625, -384.7429504394531, -374.05364990234375, -363.3643493652344, -352.675048828125, -341.9857482910156, -331.29644775390625, -320.6071472167969, -309.9178466796875, -299.2285461425781, -288.53924560546875, -277.8499450683594, -267.16064453125, -256.4713439941406, -245.78204345703125, -235.09274291992188, -224.4034423828125, -213.71414184570312, -203.02484130859375, -192.33554077148438, -181.646240234375, -170.95693969726562, -160.26763916015625, -149.57833862304688, -138.8890380859375, -128.19973754882812, -117.51043701171875, -106.82113647460938, -96.1318359375, -85.4425277709961, -74.75322723388672, -64.06391906738281, -53.37461853027344, -42.68531799316406, -31.996013641357422, -21.306713104248047, -10.617412567138672, 0.07189178466796875, 10.761192321777344, 21.450489044189453]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 8.0, 4.0, 6.0, 6.0, 12.0, 10.0, 15.0, 11.0, 16.0, 19.0, 21.0, 24.0, 40.0, 35.0, 28.0, 24.0, 32.0, 28.0, 40.0, 43.0, 40.0, 34.0, 35.0, 32.0, 35.0, 37.0, 35.0, 41.0, 32.0, 33.0, 34.0, 31.0, 22.0, 17.0, 11.0, 20.0, 10.0, 14.0, 12.0, 5.0, 13.0, 8.0, 6.0, 5.0, 5.0, 7.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-81.49776458740234, -78.55269622802734, -75.60762786865234, -72.66256713867188, -69.71749877929688, -66.77243041992188, -63.827362060546875, -60.88229751586914, -57.937232971191406, -54.992164611816406, -52.04710006713867, -49.10203170776367, -46.15696716308594, -43.21189880371094, -40.26683044433594, -37.3217658996582, -34.3766975402832, -31.431631088256836, -28.48656463623047, -25.54149627685547, -22.596431732177734, -19.651363372802734, -16.706296920776367, -13.76123046875, -10.816164016723633, -7.871097564697266, -4.92603063583374, -1.9809637069702148, 0.9641027450561523, 3.9091691970825195, 6.854236602783203, 9.79930305480957, 12.744369506835938, 15.689435958862305, 18.634502410888672, 21.579570770263672, 24.524635314941406, 27.469703674316406, 30.414770126342773, 33.35983657836914, 36.304901123046875, 39.249969482421875, 42.19503402709961, 45.14010238647461, 48.085166931152344, 51.030235290527344, 53.975303649902344, 56.92036819458008, 59.86543655395508, 62.81050491333008, 65.75556945800781, 68.70063781738281, 71.64570617675781, 74.59076690673828, 77.53583526611328, 80.48090362548828, 83.42597198486328, 86.37104034423828, 89.31610870361328, 92.26116943359375, 95.20623779296875, 98.15130615234375, 101.09637451171875, 104.04144287109375, 106.98650360107422]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 5.0, 2.0, 3.0, 3.0, 2.0, 3.0, 6.0, 5.0, 11.0, 11.0, 16.0, 18.0, 14.0, 14.0, 23.0, 37.0, 34.0, 39.0, 32.0, 39.0, 37.0, 36.0, 55.0, 44.0, 44.0, 41.0, 52.0, 33.0, 30.0, 34.0, 47.0, 24.0, 28.0, 23.0, 36.0, 20.0, 22.0, 13.0, 10.0, 13.0, 11.0, 8.0, 10.0, 4.0, 7.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-13.3125, -12.939453125, -12.56640625, -12.193359375, -11.8203125, -11.447265625, -11.07421875, -10.701171875, -10.328125, -9.955078125, -9.58203125, -9.208984375, -8.8359375, -8.462890625, -8.08984375, -7.716796875, -7.34375, -6.970703125, -6.59765625, -6.224609375, -5.8515625, -5.478515625, -5.10546875, -4.732421875, -4.359375, -3.986328125, -3.61328125, -3.240234375, -2.8671875, -2.494140625, -2.12109375, -1.748046875, -1.375, -1.001953125, -0.62890625, -0.255859375, 0.1171875, 0.490234375, 0.86328125, 1.236328125, 1.609375, 1.982421875, 2.35546875, 2.728515625, 3.1015625, 3.474609375, 3.84765625, 4.220703125, 4.59375, 4.966796875, 5.33984375, 5.712890625, 6.0859375, 6.458984375, 6.83203125, 7.205078125, 7.578125, 7.951171875, 8.32421875, 8.697265625, 9.0703125, 9.443359375, 9.81640625, 10.189453125, 10.5625]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 1.0, 4.0, 2.0, 7.0, 10.0, 7.0, 14.0, 13.0, 12.0, 24.0, 35.0, 31.0, 55.0, 92.0, 91.0, 125.0, 195.0, 303.0, 472.0, 828.0, 1396.0, 2610.0, 5371.0, 12949.0, 42954.0, 442248.0, 2901188.0, 692827.0, 60820.0, 15952.0, 6480.0, 3049.0, 1582.0, 910.0, 530.0, 327.0, 234.0, 156.0, 100.0, 67.0, 48.0, 32.0, 28.0, 27.0, 21.0, 17.0, 11.0, 11.0, 10.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0], "bins": [-29.03125, -28.19189453125, -27.3525390625, -26.51318359375, -25.673828125, -24.83447265625, -23.9951171875, -23.15576171875, -22.31640625, -21.47705078125, -20.6376953125, -19.79833984375, -18.958984375, -18.11962890625, -17.2802734375, -16.44091796875, -15.6015625, -14.76220703125, -13.9228515625, -13.08349609375, -12.244140625, -11.40478515625, -10.5654296875, -9.72607421875, -8.88671875, -8.04736328125, -7.2080078125, -6.36865234375, -5.529296875, -4.68994140625, -3.8505859375, -3.01123046875, -2.171875, -1.33251953125, -0.4931640625, 0.34619140625, 1.185546875, 2.02490234375, 2.8642578125, 3.70361328125, 4.54296875, 5.38232421875, 6.2216796875, 7.06103515625, 7.900390625, 8.73974609375, 9.5791015625, 10.41845703125, 11.2578125, 12.09716796875, 12.9365234375, 13.77587890625, 14.615234375, 15.45458984375, 16.2939453125, 17.13330078125, 17.97265625, 18.81201171875, 19.6513671875, 20.49072265625, 21.330078125, 22.16943359375, 23.0087890625, 23.84814453125, 24.6875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 5.0, 5.0, 2.0, 7.0, 7.0, 6.0, 5.0, 11.0, 12.0, 6.0, 16.0, 17.0, 21.0, 32.0, 45.0, 51.0, 64.0, 79.0, 139.0, 201.0, 310.0, 549.0, 640.0, 610.0, 426.0, 243.0, 151.0, 91.0, 80.0, 60.0, 39.0, 37.0, 20.0, 16.0, 17.0, 12.0, 5.0, 5.0, 9.0, 8.0, 5.0, 7.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.421875, -20.747314453125, -20.07275390625, -19.398193359375, -18.7236328125, -18.049072265625, -17.37451171875, -16.699951171875, -16.025390625, -15.350830078125, -14.67626953125, -14.001708984375, -13.3271484375, -12.652587890625, -11.97802734375, -11.303466796875, -10.62890625, -9.954345703125, -9.27978515625, -8.605224609375, -7.9306640625, -7.256103515625, -6.58154296875, -5.906982421875, -5.232421875, -4.557861328125, -3.88330078125, -3.208740234375, -2.5341796875, -1.859619140625, -1.18505859375, -0.510498046875, 0.1640625, 0.838623046875, 1.51318359375, 2.187744140625, 2.8623046875, 3.536865234375, 4.21142578125, 4.885986328125, 5.560546875, 6.235107421875, 6.90966796875, 7.584228515625, 8.2587890625, 8.933349609375, 9.60791015625, 10.282470703125, 10.95703125, 11.631591796875, 12.30615234375, 12.980712890625, 13.6552734375, 14.329833984375, 15.00439453125, 15.678955078125, 16.353515625, 17.028076171875, 17.70263671875, 18.377197265625, 19.0517578125, 19.726318359375, 20.40087890625, 21.075439453125, 21.75]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 7.0, 4.0, 5.0, 9.0, 6.0, 8.0, 7.0, 8.0, 12.0, 17.0, 17.0, 26.0, 40.0, 52.0, 79.0, 105.0, 191.0, 467.0, 2148.0, 22950.0, 3268477.0, 883111.0, 14082.0, 1440.0, 416.0, 171.0, 108.0, 66.0, 65.0, 45.0, 23.0, 25.0, 20.0, 12.0, 9.0, 8.0, 12.0, 4.0, 9.0, 4.0, 5.0, 6.0, 4.0, 1.0, 6.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-101.125, -97.9560546875, -94.787109375, -91.6181640625, -88.44921875, -85.2802734375, -82.111328125, -78.9423828125, -75.7734375, -72.6044921875, -69.435546875, -66.2666015625, -63.09765625, -59.9287109375, -56.759765625, -53.5908203125, -50.421875, -47.2529296875, -44.083984375, -40.9150390625, -37.74609375, -34.5771484375, -31.408203125, -28.2392578125, -25.0703125, -21.9013671875, -18.732421875, -15.5634765625, -12.39453125, -9.2255859375, -6.056640625, -2.8876953125, 0.28125, 3.4501953125, 6.619140625, 9.7880859375, 12.95703125, 16.1259765625, 19.294921875, 22.4638671875, 25.6328125, 28.8017578125, 31.970703125, 35.1396484375, 38.30859375, 41.4775390625, 44.646484375, 47.8154296875, 50.984375, 54.1533203125, 57.322265625, 60.4912109375, 63.66015625, 66.8291015625, 69.998046875, 73.1669921875, 76.3359375, 79.5048828125, 82.673828125, 85.8427734375, 89.01171875, 92.1806640625, 95.349609375, 98.5185546875, 101.6875]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 9.0, 23.0, 83.0, 186.0, 327.0, 268.0, 78.0, 29.0, 9.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-413.9048156738281, -404.8369140625, -395.76898193359375, -386.7010803222656, -377.6331481933594, -368.56524658203125, -359.497314453125, -350.4294128417969, -341.36151123046875, -332.2936096191406, -323.2256774902344, -314.15777587890625, -305.08984375, -296.0219421386719, -286.9540100097656, -277.8861083984375, -268.81817626953125, -259.7502746582031, -250.68234252929688, -241.6144256591797, -232.5465087890625, -223.47860717773438, -214.4106903076172, -205.3427734375, -196.2748565673828, -187.20693969726562, -178.13902282714844, -169.07110595703125, -160.00320434570312, -150.93527221679688, -141.86737060546875, -132.79945373535156, -123.73152160644531, -114.66360473632812, -105.59568786621094, -96.52777862548828, -87.4598617553711, -78.3919448852539, -69.32403564453125, -60.25611877441406, -51.188201904296875, -42.12028503417969, -33.052371978759766, -23.98445701599121, -14.916542053222656, -5.848625183105469, 3.219287872314453, 12.287200927734375, 21.355117797851562, 30.423032760620117, 39.49094772338867, 48.558860778808594, 57.62677764892578, 66.69469451904297, 75.76260375976562, 84.83052062988281, 93.8984375, 102.96635437011719, 112.03427124023438, 121.10218048095703, 130.17010498046875, 139.23800659179688, 148.30592346191406, 157.37384033203125, 166.44175720214844]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 7.0, 8.0, 11.0, 16.0, 16.0, 17.0, 22.0, 26.0, 27.0, 34.0, 25.0, 36.0, 34.0, 40.0, 63.0, 46.0, 64.0, 54.0, 38.0, 51.0, 42.0, 40.0, 38.0, 30.0, 41.0, 32.0, 24.0, 26.0, 21.0, 19.0, 10.0, 14.0, 7.0, 5.0, 4.0, 3.0, 9.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-102.3641586303711, -99.72129821777344, -97.07844543457031, -94.43558502197266, -91.792724609375, -89.14987182617188, -86.50701141357422, -83.86415100097656, -81.22129821777344, -78.57843780517578, -75.93558502197266, -73.292724609375, -70.64987182617188, -68.00701141357422, -65.36415100097656, -62.72129440307617, -60.07843780517578, -57.43558120727539, -54.792724609375, -52.149864196777344, -49.50700759887695, -46.86415100097656, -44.221290588378906, -41.578433990478516, -38.935577392578125, -36.292720794677734, -33.649864196777344, -31.007003784179688, -28.364147186279297, -25.721290588378906, -23.078432083129883, -20.43557357788086, -17.792709350585938, -15.14985179901123, -12.506994247436523, -9.864136695861816, -7.221279144287109, -4.578421592712402, -1.9355640411376953, 0.7072944641113281, 3.3501510620117188, 5.993008613586426, 8.635866165161133, 11.27872371673584, 13.921581268310547, 16.564437866210938, 19.20729637145996, 21.850154876708984, 24.493011474609375, 27.135868072509766, 29.77872657775879, 32.42158508300781, 35.0644416809082, 37.707298278808594, 40.35015869140625, 42.99301528930664, 45.63587188720703, 48.27872848510742, 50.92158508300781, 53.56444549560547, 56.20730209350586, 58.85015869140625, 61.493019104003906, 64.13587951660156, 66.77873229980469]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 5.0, 7.0, 7.0, 6.0, 16.0, 21.0, 17.0, 16.0, 20.0, 28.0, 33.0, 29.0, 47.0, 46.0, 42.0, 48.0, 47.0, 49.0, 42.0, 50.0, 43.0, 47.0, 46.0, 41.0, 46.0, 34.0, 29.0, 22.0, 17.0, 23.0, 9.0, 8.0, 11.0, 10.0, 12.0, 10.0, 7.0, 2.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.53125, -11.1387939453125, -10.746337890625, -10.3538818359375, -9.96142578125, -9.5689697265625, -9.176513671875, -8.7840576171875, -8.3916015625, -7.9991455078125, -7.606689453125, -7.2142333984375, -6.82177734375, -6.4293212890625, -6.036865234375, -5.6444091796875, -5.251953125, -4.8594970703125, -4.467041015625, -4.0745849609375, -3.68212890625, -3.2896728515625, -2.897216796875, -2.5047607421875, -2.1123046875, -1.7198486328125, -1.327392578125, -0.9349365234375, -0.54248046875, -0.1500244140625, 0.242431640625, 0.6348876953125, 1.02734375, 1.4197998046875, 1.812255859375, 2.2047119140625, 2.59716796875, 2.9896240234375, 3.382080078125, 3.7745361328125, 4.1669921875, 4.5594482421875, 4.951904296875, 5.3443603515625, 5.73681640625, 6.1292724609375, 6.521728515625, 6.9141845703125, 7.306640625, 7.6990966796875, 8.091552734375, 8.4840087890625, 8.87646484375, 9.2689208984375, 9.661376953125, 10.0538330078125, 10.4462890625, 10.8387451171875, 11.231201171875, 11.6236572265625, 12.01611328125, 12.4085693359375, 12.801025390625, 13.1934814453125, 13.5859375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 3.0, 3.0, 3.0, 11.0, 7.0, 13.0, 38.0, 38.0, 70.0, 83.0, 119.0, 185.0, 288.0, 435.0, 612.0, 927.0, 1298.0, 2105.0, 2925.0, 4443.0, 6616.0, 10037.0, 15429.0, 23526.0, 36663.0, 57985.0, 94546.0, 162413.0, 228635.0, 152367.0, 90258.0, 54912.0, 35018.0, 22679.0, 14549.0, 9752.0, 6357.0, 4305.0, 2929.0, 1901.0, 1252.0, 919.0, 632.0, 421.0, 293.0, 185.0, 125.0, 82.0, 55.0, 44.0, 25.0, 20.0, 19.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.2421875, -0.23423385620117188, -0.22628021240234375, -0.21832656860351562, -0.2103729248046875, -0.20241928100585938, -0.19446563720703125, -0.18651199340820312, -0.178558349609375, -0.17060470581054688, -0.16265106201171875, -0.15469741821289062, -0.1467437744140625, -0.13879013061523438, -0.13083648681640625, -0.12288284301757812, -0.11492919921875, -0.10697555541992188, -0.09902191162109375, -0.09106826782226562, -0.0831146240234375, -0.07516098022460938, -0.06720733642578125, -0.059253692626953125, -0.051300048828125, -0.043346405029296875, -0.03539276123046875, -0.027439117431640625, -0.0194854736328125, -0.011531829833984375, -0.00357818603515625, 0.004375457763671875, 0.0123291015625, 0.020282745361328125, 0.02823638916015625, 0.036190032958984375, 0.0441436767578125, 0.052097320556640625, 0.06005096435546875, 0.06800460815429688, 0.075958251953125, 0.08391189575195312, 0.09186553955078125, 0.09981918334960938, 0.1077728271484375, 0.11572647094726562, 0.12368011474609375, 0.13163375854492188, 0.13958740234375, 0.14754104614257812, 0.15549468994140625, 0.16344833374023438, 0.1714019775390625, 0.17935562133789062, 0.18730926513671875, 0.19526290893554688, 0.203216552734375, 0.21117019653320312, 0.21912384033203125, 0.22707748413085938, 0.2350311279296875, 0.24298477172851562, 0.25093841552734375, 0.2588920593261719, 0.266845703125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 5.0, 3.0, 3.0, 9.0, 8.0, 14.0, 13.0, 15.0, 16.0, 15.0, 14.0, 20.0, 22.0, 30.0, 29.0, 36.0, 44.0, 41.0, 47.0, 39.0, 47.0, 42.0, 1073.0, 33.0, 51.0, 33.0, 32.0, 31.0, 32.0, 28.0, 28.0, 23.0, 19.0, 23.0, 28.0, 23.0, 15.0, 11.0, 5.0, 9.0, 6.0, 5.0, 4.0, 3.0, 0.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.265625, -8.9947509765625, -8.723876953125, -8.4530029296875, -8.18212890625, -7.9112548828125, -7.640380859375, -7.3695068359375, -7.0986328125, -6.8277587890625, -6.556884765625, -6.2860107421875, -6.01513671875, -5.7442626953125, -5.473388671875, -5.2025146484375, -4.931640625, -4.6607666015625, -4.389892578125, -4.1190185546875, -3.84814453125, -3.5772705078125, -3.306396484375, -3.0355224609375, -2.7646484375, -2.4937744140625, -2.222900390625, -1.9520263671875, -1.68115234375, -1.4102783203125, -1.139404296875, -0.8685302734375, -0.59765625, -0.3267822265625, -0.055908203125, 0.2149658203125, 0.48583984375, 0.7567138671875, 1.027587890625, 1.2984619140625, 1.5693359375, 1.8402099609375, 2.111083984375, 2.3819580078125, 2.65283203125, 2.9237060546875, 3.194580078125, 3.4654541015625, 3.736328125, 4.0072021484375, 4.278076171875, 4.5489501953125, 4.81982421875, 5.0906982421875, 5.361572265625, 5.6324462890625, 5.9033203125, 6.1741943359375, 6.445068359375, 6.7159423828125, 6.98681640625, 7.2576904296875, 7.528564453125, 7.7994384765625, 8.0703125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 3.0, 1.0, 5.0, 9.0, 13.0, 23.0, 29.0, 39.0, 64.0, 86.0, 101.0, 133.0, 204.0, 325.0, 452.0, 638.0, 959.0, 1282.0, 1958.0, 2712.0, 4097.0, 6002.0, 9216.0, 13708.0, 20504.0, 31385.0, 48777.0, 74989.0, 122619.0, 1209038.0, 222482.0, 116616.0, 72149.0, 46336.0, 30170.0, 19723.0, 12773.0, 8714.0, 5930.0, 4035.0, 2754.0, 1911.0, 1282.0, 882.0, 626.0, 426.0, 286.0, 212.0, 131.0, 102.0, 76.0, 54.0, 33.0, 24.0, 14.0, 13.0, 4.0, 5.0, 6.0, 3.0, 2.0], "bins": [-0.1263427734375, -0.12250804901123047, -0.11867332458496094, -0.1148386001586914, -0.11100387573242188, -0.10716915130615234, -0.10333442687988281, -0.09949970245361328, -0.09566497802734375, -0.09183025360107422, -0.08799552917480469, -0.08416080474853516, -0.08032608032226562, -0.0764913558959961, -0.07265663146972656, -0.06882190704345703, -0.0649871826171875, -0.06115245819091797, -0.05731773376464844, -0.053483009338378906, -0.049648284912109375, -0.045813560485839844, -0.04197883605957031, -0.03814411163330078, -0.03430938720703125, -0.03047466278076172, -0.026639938354492188, -0.022805213928222656, -0.018970489501953125, -0.015135765075683594, -0.011301040649414062, -0.007466316223144531, -0.003631591796875, 0.00020313262939453125, 0.0040378570556640625, 0.007872581481933594, 0.011707305908203125, 0.015542030334472656, 0.019376754760742188, 0.02321147918701172, 0.02704620361328125, 0.03088092803955078, 0.03471565246582031, 0.038550376892089844, 0.042385101318359375, 0.046219825744628906, 0.05005455017089844, 0.05388927459716797, 0.0577239990234375, 0.06155872344970703, 0.06539344787597656, 0.0692281723022461, 0.07306289672851562, 0.07689762115478516, 0.08073234558105469, 0.08456707000732422, 0.08840179443359375, 0.09223651885986328, 0.09607124328613281, 0.09990596771240234, 0.10374069213867188, 0.1075754165649414, 0.11141014099121094, 0.11524486541748047, 0.11907958984375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 3.0, 3.0, 4.0, 6.0, 7.0, 13.0, 7.0, 16.0, 17.0, 24.0, 13.0, 40.0, 33.0, 42.0, 46.0, 57.0, 51.0, 53.0, 79.0, 55.0, 62.0, 61.0, 51.0, 51.0, 28.0, 30.0, 20.0, 22.0, 21.0, 23.0, 20.0, 7.0, 9.0, 7.0, 1.0, 7.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0007834434509277344, -0.0007560700178146362, -0.0007286965847015381, -0.0007013231515884399, -0.0006739497184753418, -0.0006465762853622437, -0.0006192028522491455, -0.0005918294191360474, -0.0005644559860229492, -0.0005370825529098511, -0.0005097091197967529, -0.0004823356866836548, -0.00045496225357055664, -0.0004275888204574585, -0.00040021538734436035, -0.0003728419542312622, -0.00034546852111816406, -0.0003180950880050659, -0.0002907216548919678, -0.00026334822177886963, -0.00023597478866577148, -0.00020860135555267334, -0.0001812279224395752, -0.00015385448932647705, -0.0001264810562133789, -9.910762310028076e-05, -7.173418998718262e-05, -4.436075687408447e-05, -1.6987323760986328e-05, 1.0386109352111816e-05, 3.775954246520996e-05, 6.51329755783081e-05, 9.250640869140625e-05, 0.0001198798418045044, 0.00014725327491760254, 0.00017462670803070068, 0.00020200014114379883, 0.00022937357425689697, 0.0002567470073699951, 0.00028412044048309326, 0.0003114938735961914, 0.00033886730670928955, 0.0003662407398223877, 0.00039361417293548584, 0.000420987606048584, 0.00044836103916168213, 0.0004757344722747803, 0.0005031079053878784, 0.0005304813385009766, 0.0005578547716140747, 0.0005852282047271729, 0.000612601637840271, 0.0006399750709533691, 0.0006673485040664673, 0.0006947219371795654, 0.0007220953702926636, 0.0007494688034057617, 0.0007768422365188599, 0.000804215669631958, 0.0008315891027450562, 0.0008589625358581543, 0.0008863359689712524, 0.0009137094020843506, 0.0009410828351974487, 0.0009684562683105469]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 6.0, 3.0, 3.0, 10.0, 9.0, 13.0, 27.0, 14.0, 31.0, 22.0, 32.0, 28.0, 64.0, 95.0, 194.0, 506.0, 4028.0, 1033124.0, 9130.0, 632.0, 205.0, 98.0, 58.0, 45.0, 48.0, 16.0, 24.0, 16.0, 15.0, 9.0, 11.0, 8.0, 6.0, 6.0, 2.0, 4.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.0225067138671875, -0.021874189376831055, -0.02124166488647461, -0.020609140396118164, -0.01997661590576172, -0.019344091415405273, -0.018711566925048828, -0.018079042434692383, -0.017446517944335938, -0.016813993453979492, -0.016181468963623047, -0.015548944473266602, -0.014916419982910156, -0.014283895492553711, -0.013651371002197266, -0.01301884651184082, -0.012386322021484375, -0.01175379753112793, -0.011121273040771484, -0.010488748550415039, -0.009856224060058594, -0.009223699569702148, -0.008591175079345703, -0.007958650588989258, -0.0073261260986328125, -0.006693601608276367, -0.006061077117919922, -0.0054285526275634766, -0.004796028137207031, -0.004163503646850586, -0.0035309791564941406, -0.0028984546661376953, -0.00226593017578125, -0.0016334056854248047, -0.0010008811950683594, -0.00036835670471191406, 0.00026416778564453125, 0.0008966922760009766, 0.0015292167663574219, 0.002161741256713867, 0.0027942657470703125, 0.003426790237426758, 0.004059314727783203, 0.0046918392181396484, 0.005324363708496094, 0.005956888198852539, 0.006589412689208984, 0.00722193717956543, 0.007854461669921875, 0.00848698616027832, 0.009119510650634766, 0.009752035140991211, 0.010384559631347656, 0.011017084121704102, 0.011649608612060547, 0.012282133102416992, 0.012914657592773438, 0.013547182083129883, 0.014179706573486328, 0.014812231063842773, 0.015444755554199219, 0.016077280044555664, 0.01670980453491211, 0.017342329025268555, 0.017974853515625]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 305.0, 707.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.022845227271318436, -0.02241465635597706, -0.02198408544063568, -0.021553512662649155, -0.021122941747307777, -0.0206923708319664, -0.020261799916625023, -0.019831229001283646, -0.01940065808594227, -0.01897008717060089, -0.018539516255259514, -0.018108945339918137, -0.01767837256193161, -0.017247801646590233, -0.016817230731248856, -0.01638665981590748, -0.0159560889005661, -0.015525517985224724, -0.015094946138560772, -0.014664375223219395, -0.014233804307878017, -0.013803232461214066, -0.013372661545872688, -0.012942090630531311, -0.012511517852544785, -0.012080946937203407, -0.011650375090539455, -0.011219804175198078, -0.010789233259856701, -0.010358661413192749, -0.009928090497851372, -0.009497519582509995, -0.009066947735846043, -0.008636376820504665, -0.008205804973840714, -0.007775234058499336, -0.007344663143157959, -0.006914091762155294, -0.00648352038115263, -0.006052949465811253, -0.005622378084808588, -0.0051918067038059235, -0.004761235788464546, -0.004330664407461882, -0.0039000932592898607, -0.00346952211111784, -0.0030389507301151752, -0.0026083795819431543, -0.0021778084337711334, -0.0017472372855991125, -0.0013166660210117698, -0.000886094756424427, -0.0004555236082524061, -2.4952460080385208e-05, 0.00040561892092227936, 0.0008361900690943003, 0.0012667612172663212, 0.001697332365438342, 0.002127903513610363, 0.0025584748946130276, 0.0029890460427850485, 0.0034196171909570694, 0.003850188571959734, 0.0042807599529623985, 0.004711330868303776]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 3.0, 10.0, 13.0, 16.0, 9.0, 22.0, 25.0, 22.0, 30.0, 41.0, 31.0, 39.0, 54.0, 34.0, 63.0, 53.0, 39.0, 52.0, 55.0, 54.0, 33.0, 30.0, 41.0, 32.0, 35.0, 20.0, 20.0, 27.0, 19.0, 19.0, 17.0, 9.0, 12.0, 4.0, 7.0, 3.0, 6.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0007668137550354004, -0.0007376745343208313, -0.0007085353136062622, -0.0006793960928916931, -0.000650256872177124, -0.0006211176514625549, -0.0005919784307479858, -0.0005628392100334167, -0.0005336999893188477, -0.0005045607686042786, -0.00047542154788970947, -0.0004462823271751404, -0.0004171431064605713, -0.0003880038857460022, -0.0003588646650314331, -0.000329725444316864, -0.0003005862236022949, -0.00027144700288772583, -0.00024230778217315674, -0.00021316856145858765, -0.00018402934074401855, -0.00015489012002944946, -0.00012575089931488037, -9.661167860031128e-05, -6.747245788574219e-05, -3.8333237171173096e-05, -9.194016456604004e-06, 1.9945204257965088e-05, 4.908442497253418e-05, 7.822364568710327e-05, 0.00010736286640167236, 0.00013650208711624146, 0.00016564130783081055, 0.00019478052854537964, 0.00022391974925994873, 0.0002530589699745178, 0.0002821981906890869, 0.000311337411403656, 0.0003404766321182251, 0.0003696158528327942, 0.0003987550735473633, 0.0004278942942619324, 0.00045703351497650146, 0.00048617273569107056, 0.0005153119564056396, 0.0005444511771202087, 0.0005735903978347778, 0.0006027296185493469, 0.000631868839263916, 0.0006610080599784851, 0.0006901472806930542, 0.0007192865014076233, 0.0007484257221221924, 0.0007775649428367615, 0.0008067041635513306, 0.0008358433842658997, 0.0008649826049804688, 0.0008941218256950378, 0.0009232610464096069, 0.000952400267124176, 0.0009815394878387451, 0.0010106787085533142, 0.0010398179292678833, 0.0010689571499824524, 0.0010980963706970215]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 5.0, 7.0, 7.0, 6.0, 16.0, 21.0, 17.0, 16.0, 20.0, 28.0, 33.0, 29.0, 47.0, 46.0, 42.0, 48.0, 47.0, 49.0, 42.0, 50.0, 43.0, 47.0, 46.0, 41.0, 46.0, 34.0, 29.0, 22.0, 17.0, 23.0, 9.0, 8.0, 11.0, 10.0, 12.0, 10.0, 7.0, 2.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.53125, -11.1387939453125, -10.746337890625, -10.3538818359375, -9.96142578125, -9.5689697265625, -9.176513671875, -8.7840576171875, -8.3916015625, -7.9991455078125, -7.606689453125, -7.2142333984375, -6.82177734375, -6.4293212890625, -6.036865234375, -5.6444091796875, -5.251953125, -4.8594970703125, -4.467041015625, -4.0745849609375, -3.68212890625, -3.2896728515625, -2.897216796875, -2.5047607421875, -2.1123046875, -1.7198486328125, -1.327392578125, -0.9349365234375, -0.54248046875, -0.1500244140625, 0.242431640625, 0.6348876953125, 1.02734375, 1.4197998046875, 1.812255859375, 2.2047119140625, 2.59716796875, 2.9896240234375, 3.382080078125, 3.7745361328125, 4.1669921875, 4.5594482421875, 4.951904296875, 5.3443603515625, 5.73681640625, 6.1292724609375, 6.521728515625, 6.9141845703125, 7.306640625, 7.6990966796875, 8.091552734375, 8.4840087890625, 8.87646484375, 9.2689208984375, 9.661376953125, 10.0538330078125, 10.4462890625, 10.8387451171875, 11.231201171875, 11.6236572265625, 12.01611328125, 12.4085693359375, 12.801025390625, 13.1934814453125, 13.5859375]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 2.0, 7.0, 11.0, 10.0, 11.0, 11.0, 19.0, 23.0, 45.0, 54.0, 79.0, 106.0, 149.0, 172.0, 232.0, 339.0, 483.0, 698.0, 1030.0, 1402.0, 2091.0, 3260.0, 4902.0, 8415.0, 16188.0, 39790.0, 139154.0, 623795.0, 129454.0, 37939.0, 15742.0, 8023.0, 4955.0, 3124.0, 2086.0, 1351.0, 961.0, 699.0, 482.0, 352.0, 231.0, 187.0, 141.0, 91.0, 76.0, 43.0, 35.0, 31.0, 20.0, 18.0, 19.0, 4.0, 14.0, 8.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-13.3984375, -12.9727783203125, -12.547119140625, -12.1214599609375, -11.69580078125, -11.2701416015625, -10.844482421875, -10.4188232421875, -9.9931640625, -9.5675048828125, -9.141845703125, -8.7161865234375, -8.29052734375, -7.8648681640625, -7.439208984375, -7.0135498046875, -6.587890625, -6.1622314453125, -5.736572265625, -5.3109130859375, -4.88525390625, -4.4595947265625, -4.033935546875, -3.6082763671875, -3.1826171875, -2.7569580078125, -2.331298828125, -1.9056396484375, -1.47998046875, -1.0543212890625, -0.628662109375, -0.2030029296875, 0.22265625, 0.6483154296875, 1.073974609375, 1.4996337890625, 1.92529296875, 2.3509521484375, 2.776611328125, 3.2022705078125, 3.6279296875, 4.0535888671875, 4.479248046875, 4.9049072265625, 5.33056640625, 5.7562255859375, 6.181884765625, 6.6075439453125, 7.033203125, 7.4588623046875, 7.884521484375, 8.3101806640625, 8.73583984375, 9.1614990234375, 9.587158203125, 10.0128173828125, 10.4384765625, 10.8641357421875, 11.289794921875, 11.7154541015625, 12.14111328125, 12.5667724609375, 12.992431640625, 13.4180908203125, 13.84375]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 1.0, 4.0, 6.0, 8.0, 8.0, 9.0, 14.0, 9.0, 19.0, 20.0, 21.0, 21.0, 19.0, 30.0, 21.0, 33.0, 42.0, 38.0, 50.0, 50.0, 91.0, 177.0, 1736.0, 150.0, 68.0, 48.0, 48.0, 35.0, 39.0, 36.0, 25.0, 31.0, 29.0, 26.0, 23.0, 18.0, 10.0, 14.0, 5.0, 6.0, 4.0, 4.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-37.9375, -36.73095703125, -35.5244140625, -34.31787109375, -33.111328125, -31.90478515625, -30.6982421875, -29.49169921875, -28.28515625, -27.07861328125, -25.8720703125, -24.66552734375, -23.458984375, -22.25244140625, -21.0458984375, -19.83935546875, -18.6328125, -17.42626953125, -16.2197265625, -15.01318359375, -13.806640625, -12.60009765625, -11.3935546875, -10.18701171875, -8.98046875, -7.77392578125, -6.5673828125, -5.36083984375, -4.154296875, -2.94775390625, -1.7412109375, -0.53466796875, 0.671875, 1.87841796875, 3.0849609375, 4.29150390625, 5.498046875, 6.70458984375, 7.9111328125, 9.11767578125, 10.32421875, 11.53076171875, 12.7373046875, 13.94384765625, 15.150390625, 16.35693359375, 17.5634765625, 18.77001953125, 19.9765625, 21.18310546875, 22.3896484375, 23.59619140625, 24.802734375, 26.00927734375, 27.2158203125, 28.42236328125, 29.62890625, 30.83544921875, 32.0419921875, 33.24853515625, 34.455078125, 35.66162109375, 36.8681640625, 38.07470703125, 39.28125]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 9.0, 6.0, 9.0, 14.0, 17.0, 21.0, 29.0, 31.0, 34.0, 45.0, 50.0, 91.0, 140.0, 146.0, 229.0, 645.0, 2103.0, 13423.0, 2467508.0, 647140.0, 10784.0, 1814.0, 515.0, 238.0, 146.0, 115.0, 86.0, 49.0, 48.0, 39.0, 37.0, 31.0, 35.0, 11.0, 9.0, 13.0, 10.0, 8.0, 4.0, 7.0, 5.0, 6.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-88.8125, -86.271484375, -83.73046875, -81.189453125, -78.6484375, -76.107421875, -73.56640625, -71.025390625, -68.484375, -65.943359375, -63.40234375, -60.861328125, -58.3203125, -55.779296875, -53.23828125, -50.697265625, -48.15625, -45.615234375, -43.07421875, -40.533203125, -37.9921875, -35.451171875, -32.91015625, -30.369140625, -27.828125, -25.287109375, -22.74609375, -20.205078125, -17.6640625, -15.123046875, -12.58203125, -10.041015625, -7.5, -4.958984375, -2.41796875, 0.123046875, 2.6640625, 5.205078125, 7.74609375, 10.287109375, 12.828125, 15.369140625, 17.91015625, 20.451171875, 22.9921875, 25.533203125, 28.07421875, 30.615234375, 33.15625, 35.697265625, 38.23828125, 40.779296875, 43.3203125, 45.861328125, 48.40234375, 50.943359375, 53.484375, 56.025390625, 58.56640625, 61.107421875, 63.6484375, 66.189453125, 68.73046875, 71.271484375, 73.8125]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 42.0, 218.0, 542.0, 161.0, 36.0, 8.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.95651245117188, -108.3705062866211, -101.78450012207031, -95.19850158691406, -88.61249542236328, -82.0264892578125, -75.44048309326172, -68.85447692871094, -62.26847457885742, -55.68246841430664, -49.096466064453125, -42.510459899902344, -35.92445373535156, -29.338451385498047, -22.752445220947266, -16.16644287109375, -9.580436706542969, -2.994431972503662, 3.5915727615356445, 10.17757797241211, 16.763582229614258, 23.349586486816406, 29.935592651367188, 36.5215950012207, 43.107601165771484, 49.693607330322266, 56.27960968017578, 62.86561584472656, 69.45162200927734, 76.03762817382812, 82.62362670898438, 89.20963287353516, 95.79563903808594, 102.38164520263672, 108.9676513671875, 115.55364990234375, 122.13965606689453, 128.7256622314453, 135.31167602539062, 141.89767456054688, 148.48367309570312, 155.06967163085938, 161.6556854248047, 168.24168395996094, 174.82769775390625, 181.4136962890625, 187.99969482421875, 194.58570861816406, 201.17172241210938, 207.75772094726562, 214.34373474121094, 220.9297332763672, 227.5157470703125, 234.10174560546875, 240.687744140625, 247.2737579345703, 253.85975646972656, 260.4457702636719, 267.0317687988281, 273.6177673339844, 280.2037658691406, 286.789794921875, 293.37579345703125, 299.9617919921875, 306.54779052734375]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 5.0, 1.0, 3.0, 2.0, 3.0, 2.0, 10.0, 6.0, 11.0, 14.0, 11.0, 8.0, 7.0, 14.0, 12.0, 39.0, 31.0, 39.0, 25.0, 37.0, 41.0, 44.0, 44.0, 42.0, 43.0, 43.0, 43.0, 35.0, 41.0, 35.0, 47.0, 27.0, 38.0, 35.0, 18.0, 21.0, 18.0, 22.0, 13.0, 18.0, 17.0, 11.0, 7.0, 7.0, 7.0, 6.0, 2.0, 1.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-88.6780776977539, -85.90892791748047, -83.13977813720703, -80.37063598632812, -77.60148620605469, -74.83233642578125, -72.06318664550781, -69.29403686523438, -66.52489471435547, -63.75574493408203, -60.98659896850586, -58.21744918823242, -55.44830322265625, -52.67915344238281, -49.910003662109375, -47.1408576965332, -44.371707916259766, -41.60255813598633, -38.833412170410156, -36.06426239013672, -33.29511642456055, -30.52596664428711, -27.756818771362305, -24.9876708984375, -22.218523025512695, -19.44937515258789, -16.680227279663086, -13.911078453063965, -11.14193058013916, -8.372782707214355, -5.603633880615234, -2.8344860076904297, -0.065338134765625, 2.703809976577759, 5.472958087921143, 8.242106437683105, 11.01125431060791, 13.780402183532715, 16.549551010131836, 19.31869888305664, 22.087846755981445, 24.85699462890625, 27.626142501831055, 30.39529037475586, 33.1644401550293, 35.93358612060547, 38.702735900878906, 41.471885681152344, 44.241031646728516, 47.01018142700195, 49.779327392578125, 52.54847717285156, 55.317623138427734, 58.08677291870117, 60.855918884277344, 63.62506866455078, 66.39421844482422, 69.16336822509766, 71.9325180053711, 74.70166015625, 77.47080993652344, 80.23995971679688, 83.00910949707031, 85.77825927734375, 88.54740142822266]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 1.0, 4.0, 5.0, 4.0, 6.0, 15.0, 14.0, 16.0, 16.0, 18.0, 15.0, 26.0, 25.0, 34.0, 44.0, 44.0, 45.0, 47.0, 46.0, 34.0, 51.0, 50.0, 46.0, 38.0, 34.0, 41.0, 47.0, 39.0, 29.0, 30.0, 23.0, 25.0, 11.0, 15.0, 11.0, 9.0, 8.0, 3.0, 9.0, 5.0, 7.0, 5.0, 7.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.9921875, -11.604736328125, -11.21728515625, -10.829833984375, -10.4423828125, -10.054931640625, -9.66748046875, -9.280029296875, -8.892578125, -8.505126953125, -8.11767578125, -7.730224609375, -7.3427734375, -6.955322265625, -6.56787109375, -6.180419921875, -5.79296875, -5.405517578125, -5.01806640625, -4.630615234375, -4.2431640625, -3.855712890625, -3.46826171875, -3.080810546875, -2.693359375, -2.305908203125, -1.91845703125, -1.531005859375, -1.1435546875, -0.756103515625, -0.36865234375, 0.018798828125, 0.40625, 0.793701171875, 1.18115234375, 1.568603515625, 1.9560546875, 2.343505859375, 2.73095703125, 3.118408203125, 3.505859375, 3.893310546875, 4.28076171875, 4.668212890625, 5.0556640625, 5.443115234375, 5.83056640625, 6.218017578125, 6.60546875, 6.992919921875, 7.38037109375, 7.767822265625, 8.1552734375, 8.542724609375, 8.93017578125, 9.317626953125, 9.705078125, 10.092529296875, 10.47998046875, 10.867431640625, 11.2548828125, 11.642333984375, 12.02978515625, 12.417236328125, 12.8046875]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 2.0, 8.0, 6.0, 13.0, 20.0, 21.0, 20.0, 26.0, 34.0, 64.0, 78.0, 139.0, 218.0, 429.0, 935.0, 2282.0, 6164.0, 19801.0, 146059.0, 3074374.0, 883168.0, 42907.0, 10812.0, 3701.0, 1376.0, 688.0, 365.0, 181.0, 113.0, 62.0, 59.0, 40.0, 26.0, 14.0, 11.0, 13.0, 9.0, 6.0, 9.0, 7.0, 4.0, 5.0, 7.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.03125, -34.85986328125, -33.6884765625, -32.51708984375, -31.345703125, -30.17431640625, -29.0029296875, -27.83154296875, -26.66015625, -25.48876953125, -24.3173828125, -23.14599609375, -21.974609375, -20.80322265625, -19.6318359375, -18.46044921875, -17.2890625, -16.11767578125, -14.9462890625, -13.77490234375, -12.603515625, -11.43212890625, -10.2607421875, -9.08935546875, -7.91796875, -6.74658203125, -5.5751953125, -4.40380859375, -3.232421875, -2.06103515625, -0.8896484375, 0.28173828125, 1.453125, 2.62451171875, 3.7958984375, 4.96728515625, 6.138671875, 7.31005859375, 8.4814453125, 9.65283203125, 10.82421875, 11.99560546875, 13.1669921875, 14.33837890625, 15.509765625, 16.68115234375, 17.8525390625, 19.02392578125, 20.1953125, 21.36669921875, 22.5380859375, 23.70947265625, 24.880859375, 26.05224609375, 27.2236328125, 28.39501953125, 29.56640625, 30.73779296875, 31.9091796875, 33.08056640625, 34.251953125, 35.42333984375, 36.5947265625, 37.76611328125, 38.9375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 0.0, 5.0, 5.0, 3.0, 7.0, 8.0, 17.0, 19.0, 15.0, 27.0, 30.0, 31.0, 53.0, 75.0, 101.0, 126.0, 261.0, 485.0, 740.0, 748.0, 520.0, 302.0, 144.0, 103.0, 65.0, 40.0, 37.0, 23.0, 21.0, 10.0, 15.0, 9.0, 9.0, 3.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.78125, -25.001708984375, -24.22216796875, -23.442626953125, -22.6630859375, -21.883544921875, -21.10400390625, -20.324462890625, -19.544921875, -18.765380859375, -17.98583984375, -17.206298828125, -16.4267578125, -15.647216796875, -14.86767578125, -14.088134765625, -13.30859375, -12.529052734375, -11.74951171875, -10.969970703125, -10.1904296875, -9.410888671875, -8.63134765625, -7.851806640625, -7.072265625, -6.292724609375, -5.51318359375, -4.733642578125, -3.9541015625, -3.174560546875, -2.39501953125, -1.615478515625, -0.8359375, -0.056396484375, 0.72314453125, 1.502685546875, 2.2822265625, 3.061767578125, 3.84130859375, 4.620849609375, 5.400390625, 6.179931640625, 6.95947265625, 7.739013671875, 8.5185546875, 9.298095703125, 10.07763671875, 10.857177734375, 11.63671875, 12.416259765625, 13.19580078125, 13.975341796875, 14.7548828125, 15.534423828125, 16.31396484375, 17.093505859375, 17.873046875, 18.652587890625, 19.43212890625, 20.211669921875, 20.9912109375, 21.770751953125, 22.55029296875, 23.329833984375, 24.109375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 4.0, 6.0, 4.0, 11.0, 12.0, 13.0, 22.0, 25.0, 29.0, 51.0, 76.0, 142.0, 309.0, 1206.0, 13398.0, 3166538.0, 1001611.0, 9165.0, 966.0, 221.0, 145.0, 84.0, 56.0, 36.0, 29.0, 32.0, 19.0, 16.0, 15.0, 10.0, 8.0, 1.0, 5.0, 4.0, 1.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-117.375, -113.5810546875, -109.787109375, -105.9931640625, -102.19921875, -98.4052734375, -94.611328125, -90.8173828125, -87.0234375, -83.2294921875, -79.435546875, -75.6416015625, -71.84765625, -68.0537109375, -64.259765625, -60.4658203125, -56.671875, -52.8779296875, -49.083984375, -45.2900390625, -41.49609375, -37.7021484375, -33.908203125, -30.1142578125, -26.3203125, -22.5263671875, -18.732421875, -14.9384765625, -11.14453125, -7.3505859375, -3.556640625, 0.2373046875, 4.03125, 7.8251953125, 11.619140625, 15.4130859375, 19.20703125, 23.0009765625, 26.794921875, 30.5888671875, 34.3828125, 38.1767578125, 41.970703125, 45.7646484375, 49.55859375, 53.3525390625, 57.146484375, 60.9404296875, 64.734375, 68.5283203125, 72.322265625, 76.1162109375, 79.91015625, 83.7041015625, 87.498046875, 91.2919921875, 95.0859375, 98.8798828125, 102.673828125, 106.4677734375, 110.26171875, 114.0556640625, 117.849609375, 121.6435546875, 125.4375]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 11.0, 23.0, 57.0, 90.0, 157.0, 195.0, 201.0, 145.0, 75.0, 27.0, 19.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-132.41262817382812, -127.2995834350586, -122.1865463256836, -117.07350158691406, -111.96046447753906, -106.84741973876953, -101.734375, -96.621337890625, -91.50829315185547, -86.39524841308594, -81.28221130371094, -76.1691665649414, -71.05612182617188, -65.94308471679688, -60.830039978027344, -55.71699905395508, -50.60395812988281, -45.49091720581055, -40.37787628173828, -35.26483154296875, -30.151790618896484, -25.03874969482422, -19.92570686340332, -14.812664031982422, -9.699623107910156, -4.586581230163574, 0.5264606475830078, 5.63950252532959, 10.752544403076172, 15.865585327148438, 20.978628158569336, 26.091670989990234, 31.204696655273438, 36.3177375793457, 41.43077850341797, 46.5438232421875, 51.656864166259766, 56.76990509033203, 61.88294982910156, 66.99598693847656, 72.1090316772461, 77.22207641601562, 82.33511352539062, 87.44815826416016, 92.56120300292969, 97.67424011230469, 102.78728485107422, 107.90032958984375, 113.01336669921875, 118.12641143798828, 123.23944854736328, 128.3524932861328, 133.4655303955078, 138.57858276367188, 143.69161987304688, 148.80465698242188, 153.91769409179688, 159.03073120117188, 164.14378356933594, 169.25682067871094, 174.36985778808594, 179.48291015625, 184.595947265625, 189.708984375, 194.82203674316406]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 1.0, 3.0, 7.0, 8.0, 11.0, 12.0, 18.0, 14.0, 16.0, 24.0, 22.0, 29.0, 35.0, 32.0, 40.0, 27.0, 39.0, 41.0, 50.0, 49.0, 39.0, 57.0, 45.0, 37.0, 48.0, 38.0, 28.0, 38.0, 37.0, 29.0, 29.0, 21.0, 18.0, 12.0, 10.0, 10.0, 8.0, 7.0, 6.0, 2.0, 1.0, 0.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-75.47439575195312, -73.06916046142578, -70.66392517089844, -68.25869750976562, -65.85346221923828, -63.44822692871094, -61.042991638183594, -58.63775634765625, -56.23252487182617, -53.82728958129883, -51.42205810546875, -49.016822814941406, -46.61158752441406, -44.206356048583984, -41.80112075805664, -39.39588928222656, -36.99065399169922, -34.585418701171875, -32.1801872253418, -29.774951934814453, -27.369718551635742, -24.96448516845703, -22.559249877929688, -20.154016494750977, -17.748783111572266, -15.343549728393555, -12.938315391540527, -10.5330810546875, -8.127847671508789, -5.722614288330078, -3.317379951477051, -0.9121456146240234, 1.4930877685546875, 3.8983216285705566, 6.303555488586426, 8.708789825439453, 11.114023208618164, 13.519256591796875, 15.924490928649902, 18.32972526550293, 20.73495864868164, 23.14019203186035, 25.545425415039062, 27.950660705566406, 30.355894088745117, 32.76112747192383, 35.16636276245117, 37.57159423828125, 39.976829528808594, 42.38206481933594, 44.787296295166016, 47.19253158569336, 49.59776306152344, 52.00299835205078, 54.408233642578125, 56.81346893310547, 59.21870040893555, 61.62393569946289, 64.02916717529297, 66.43440246582031, 68.83963775634766, 71.244873046875, 73.65010070800781, 76.05533599853516, 78.4605712890625]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 2.0, 6.0, 1.0, 5.0, 1.0, 8.0, 8.0, 8.0, 13.0, 20.0, 19.0, 18.0, 20.0, 29.0, 33.0, 34.0, 42.0, 34.0, 41.0, 40.0, 43.0, 42.0, 33.0, 49.0, 39.0, 44.0, 42.0, 35.0, 44.0, 26.0, 29.0, 35.0, 18.0, 22.0, 19.0, 17.0, 16.0, 12.0, 11.0, 7.0, 10.0, 5.0, 4.0, 6.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.0078125, -10.6531982421875, -10.298583984375, -9.9439697265625, -9.58935546875, -9.2347412109375, -8.880126953125, -8.5255126953125, -8.1708984375, -7.8162841796875, -7.461669921875, -7.1070556640625, -6.75244140625, -6.3978271484375, -6.043212890625, -5.6885986328125, -5.333984375, -4.9793701171875, -4.624755859375, -4.2701416015625, -3.91552734375, -3.5609130859375, -3.206298828125, -2.8516845703125, -2.4970703125, -2.1424560546875, -1.787841796875, -1.4332275390625, -1.07861328125, -0.7239990234375, -0.369384765625, -0.0147705078125, 0.33984375, 0.6944580078125, 1.049072265625, 1.4036865234375, 1.75830078125, 2.1129150390625, 2.467529296875, 2.8221435546875, 3.1767578125, 3.5313720703125, 3.885986328125, 4.2406005859375, 4.59521484375, 4.9498291015625, 5.304443359375, 5.6590576171875, 6.013671875, 6.3682861328125, 6.722900390625, 7.0775146484375, 7.43212890625, 7.7867431640625, 8.141357421875, 8.4959716796875, 8.8505859375, 9.2052001953125, 9.559814453125, 9.9144287109375, 10.26904296875, 10.6236572265625, 10.978271484375, 11.3328857421875, 11.6875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [5.0, 0.0, 5.0, 7.0, 6.0, 10.0, 21.0, 16.0, 24.0, 33.0, 53.0, 71.0, 95.0, 142.0, 201.0, 291.0, 405.0, 548.0, 774.0, 1119.0, 1524.0, 2302.0, 3233.0, 4731.0, 6505.0, 9760.0, 14520.0, 21567.0, 32333.0, 49374.0, 75475.0, 116719.0, 186003.0, 183837.0, 115538.0, 74450.0, 48511.0, 31814.0, 21155.0, 14196.0, 9511.0, 6533.0, 4583.0, 3167.0, 2176.0, 1509.0, 1064.0, 790.0, 559.0, 368.0, 272.0, 174.0, 151.0, 111.0, 68.0, 38.0, 41.0, 28.0, 19.0, 18.0, 9.0, 7.0, 5.0, 2.0], "bins": [-0.2447509765625, -0.23732948303222656, -0.22990798950195312, -0.2224864959716797, -0.21506500244140625, -0.2076435089111328, -0.20022201538085938, -0.19280052185058594, -0.1853790283203125, -0.17795753479003906, -0.17053604125976562, -0.1631145477294922, -0.15569305419921875, -0.1482715606689453, -0.14085006713867188, -0.13342857360839844, -0.126007080078125, -0.11858558654785156, -0.11116409301757812, -0.10374259948730469, -0.09632110595703125, -0.08889961242675781, -0.08147811889648438, -0.07405662536621094, -0.0666351318359375, -0.05921363830566406, -0.051792144775390625, -0.04437065124511719, -0.03694915771484375, -0.029527664184570312, -0.022106170654296875, -0.014684677124023438, -0.00726318359375, 0.0001583099365234375, 0.007579803466796875, 0.015001296997070312, 0.02242279052734375, 0.029844284057617188, 0.037265777587890625, 0.04468727111816406, 0.0521087646484375, 0.05953025817871094, 0.06695175170898438, 0.07437324523925781, 0.08179473876953125, 0.08921623229980469, 0.09663772583007812, 0.10405921936035156, 0.111480712890625, 0.11890220642089844, 0.12632369995117188, 0.1337451934814453, 0.14116668701171875, 0.1485881805419922, 0.15600967407226562, 0.16343116760253906, 0.1708526611328125, 0.17827415466308594, 0.18569564819335938, 0.1931171417236328, 0.20053863525390625, 0.2079601287841797, 0.21538162231445312, 0.22280311584472656, 0.230224609375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 8.0, 8.0, 5.0, 7.0, 9.0, 13.0, 23.0, 20.0, 23.0, 36.0, 25.0, 29.0, 43.0, 30.0, 45.0, 29.0, 35.0, 45.0, 1067.0, 49.0, 52.0, 39.0, 46.0, 41.0, 35.0, 35.0, 22.0, 38.0, 18.0, 27.0, 27.0, 16.0, 20.0, 13.0, 14.0, 10.0, 7.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.25, -7.9605712890625, -7.671142578125, -7.3817138671875, -7.09228515625, -6.8028564453125, -6.513427734375, -6.2239990234375, -5.9345703125, -5.6451416015625, -5.355712890625, -5.0662841796875, -4.77685546875, -4.4874267578125, -4.197998046875, -3.9085693359375, -3.619140625, -3.3297119140625, -3.040283203125, -2.7508544921875, -2.46142578125, -2.1719970703125, -1.882568359375, -1.5931396484375, -1.3037109375, -1.0142822265625, -0.724853515625, -0.4354248046875, -0.14599609375, 0.1434326171875, 0.432861328125, 0.7222900390625, 1.01171875, 1.3011474609375, 1.590576171875, 1.8800048828125, 2.16943359375, 2.4588623046875, 2.748291015625, 3.0377197265625, 3.3271484375, 3.6165771484375, 3.906005859375, 4.1954345703125, 4.48486328125, 4.7742919921875, 5.063720703125, 5.3531494140625, 5.642578125, 5.9320068359375, 6.221435546875, 6.5108642578125, 6.80029296875, 7.0897216796875, 7.379150390625, 7.6685791015625, 7.9580078125, 8.2474365234375, 8.536865234375, 8.8262939453125, 9.11572265625, 9.4051513671875, 9.694580078125, 9.9840087890625, 10.2734375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 4.0, 8.0, 9.0, 9.0, 23.0, 33.0, 70.0, 78.0, 118.0, 152.0, 250.0, 358.0, 491.0, 809.0, 1132.0, 1786.0, 2546.0, 3868.0, 6008.0, 9198.0, 14203.0, 21965.0, 34272.0, 53427.0, 84543.0, 139063.0, 1259097.0, 173519.0, 106158.0, 66261.0, 41833.0, 26542.0, 17115.0, 10950.0, 7101.0, 4689.0, 3031.0, 2082.0, 1374.0, 949.0, 629.0, 448.0, 294.0, 207.0, 146.0, 96.0, 64.0, 44.0, 34.0, 19.0, 11.0, 6.0, 5.0, 10.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.1217041015625, -0.11761093139648438, -0.11351776123046875, -0.10942459106445312, -0.1053314208984375, -0.10123825073242188, -0.09714508056640625, -0.09305191040039062, -0.088958740234375, -0.08486557006835938, -0.08077239990234375, -0.07667922973632812, -0.0725860595703125, -0.06849288940429688, -0.06439971923828125, -0.060306549072265625, -0.05621337890625, -0.052120208740234375, -0.04802703857421875, -0.043933868408203125, -0.0398406982421875, -0.035747528076171875, -0.03165435791015625, -0.027561187744140625, -0.023468017578125, -0.019374847412109375, -0.01528167724609375, -0.011188507080078125, -0.0070953369140625, -0.003002166748046875, 0.00109100341796875, 0.005184173583984375, 0.00927734375, 0.013370513916015625, 0.01746368408203125, 0.021556854248046875, 0.0256500244140625, 0.029743194580078125, 0.03383636474609375, 0.037929534912109375, 0.042022705078125, 0.046115875244140625, 0.05020904541015625, 0.054302215576171875, 0.0583953857421875, 0.062488555908203125, 0.06658172607421875, 0.07067489624023438, 0.07476806640625, 0.07886123657226562, 0.08295440673828125, 0.08704757690429688, 0.0911407470703125, 0.09523391723632812, 0.09932708740234375, 0.10342025756835938, 0.107513427734375, 0.11160659790039062, 0.11569976806640625, 0.11979293823242188, 0.1238861083984375, 0.12797927856445312, 0.13207244873046875, 0.13616561889648438, 0.1402587890625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 11.0, 3.0, 14.0, 12.0, 19.0, 13.0, 24.0, 31.0, 44.0, 45.0, 71.0, 96.0, 85.0, 100.0, 76.0, 70.0, 64.0, 33.0, 42.0, 28.0, 20.0, 23.0, 16.0, 12.0, 10.0, 9.0, 8.0, 4.0, 4.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011749267578125, -0.0011394768953323364, -0.0011040270328521729, -0.0010685771703720093, -0.0010331273078918457, -0.0009976774454116821, -0.0009622275829315186, -0.000926777720451355, -0.0008913278579711914, -0.0008558779954910278, -0.0008204281330108643, -0.0007849782705307007, -0.0007495284080505371, -0.0007140785455703735, -0.00067862868309021, -0.0006431788206100464, -0.0006077289581298828, -0.0005722790956497192, -0.0005368292331695557, -0.0005013793706893921, -0.0004659295082092285, -0.00043047964572906494, -0.00039502978324890137, -0.0003595799207687378, -0.0003241300582885742, -0.00028868019580841064, -0.00025323033332824707, -0.0002177804708480835, -0.00018233060836791992, -0.00014688074588775635, -0.00011143088340759277, -7.59810209274292e-05, -4.0531158447265625e-05, -5.081295967102051e-06, 3.0368566513061523e-05, 6.58184289932251e-05, 0.00010126829147338867, 0.00013671815395355225, 0.00017216801643371582, 0.0002076178789138794, 0.00024306774139404297, 0.00027851760387420654, 0.0003139674663543701, 0.0003494173288345337, 0.00038486719131469727, 0.00042031705379486084, 0.0004557669162750244, 0.000491216778755188, 0.0005266666412353516, 0.0005621165037155151, 0.0005975663661956787, 0.0006330162286758423, 0.0006684660911560059, 0.0007039159536361694, 0.000739365816116333, 0.0007748156785964966, 0.0008102655410766602, 0.0008457154035568237, 0.0008811652660369873, 0.0009166151285171509, 0.0009520649909973145, 0.000987514853477478, 0.0010229647159576416, 0.0010584145784378052, 0.0010938644409179688]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 4.0, 10.0, 7.0, 11.0, 12.0, 17.0, 21.0, 23.0, 29.0, 52.0, 54.0, 121.0, 276.0, 1337.0, 1016373.0, 29138.0, 600.0, 183.0, 79.0, 55.0, 36.0, 23.0, 16.0, 19.0, 11.0, 15.0, 2.0, 11.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0255584716796875, -0.02472853660583496, -0.023898601531982422, -0.023068666458129883, -0.022238731384277344, -0.021408796310424805, -0.020578861236572266, -0.019748926162719727, -0.018918991088867188, -0.01808905601501465, -0.01725912094116211, -0.01642918586730957, -0.015599250793457031, -0.014769315719604492, -0.013939380645751953, -0.013109445571899414, -0.012279510498046875, -0.011449575424194336, -0.010619640350341797, -0.009789705276489258, -0.008959770202636719, -0.00812983512878418, -0.007299900054931641, -0.0064699649810791016, -0.0056400299072265625, -0.0048100948333740234, -0.003980159759521484, -0.0031502246856689453, -0.0023202896118164062, -0.0014903545379638672, -0.0006604194641113281, 0.00016951560974121094, 0.00099945068359375, 0.001829385757446289, 0.002659320831298828, 0.003489255905151367, 0.004319190979003906, 0.005149126052856445, 0.005979061126708984, 0.0068089962005615234, 0.0076389312744140625, 0.008468866348266602, 0.00929880142211914, 0.01012873649597168, 0.010958671569824219, 0.011788606643676758, 0.012618541717529297, 0.013448476791381836, 0.014278411865234375, 0.015108346939086914, 0.015938282012939453, 0.016768217086791992, 0.01759815216064453, 0.01842808723449707, 0.01925802230834961, 0.02008795738220215, 0.020917892456054688, 0.021747827529907227, 0.022577762603759766, 0.023407697677612305, 0.024237632751464844, 0.025067567825317383, 0.025897502899169922, 0.02672743797302246, 0.027557373046875]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 29.0, 973.0, 14.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02001454494893551, -0.01960132271051407, -0.01918810047209263, -0.018774880096316338, -0.018361657857894897, -0.017948435619473457, -0.017535213381052017, -0.017121993005275726, -0.016708770766854286, -0.016295548528432846, -0.015882326290011406, -0.01546910498291254, -0.015055883675813675, -0.014642661437392235, -0.01422944013029337, -0.01381621789187193, -0.013402996584773064, -0.012989774346351624, -0.012576553039252758, -0.012163330800831318, -0.011750109493732452, -0.011336887255311012, -0.010923665948212147, -0.010510443709790707, -0.010097221471369267, -0.009683999232947826, -0.009270777925848961, -0.00885755568742752, -0.008444334380328655, -0.008031112141907215, -0.00761789083480835, -0.0072046685963869095, -0.006791446823626757, -0.006378225050866604, -0.005965003278106451, -0.005551781505346298, -0.005138559732586145, -0.004725337959825993, -0.0043121157214045525, -0.0038988941814750433, -0.0034856724087148905, -0.0030724506359547377, -0.002659228863194585, -0.0022460068576037884, -0.0018327852012589574, -0.0014195633120834827, -0.00100634153932333, -0.0005931197665631771, -0.0001798979938030243, 0.00023332380806095898, 0.0006465456099249423, 0.001059767440892756, 0.0014729892136529088, 0.0018862111028283834, 0.0022994328755885363, 0.002712654648348689, 0.003125876421108842, 0.0035390981938689947, 0.003952320199459791, 0.004365541972219944, 0.004778763744980097, 0.00519198551774025, 0.0056052072905004025, 0.006018429063260555, 0.006431650836020708]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 13.0, 13.0, 15.0, 18.0, 27.0, 27.0, 28.0, 45.0, 43.0, 45.0, 55.0, 43.0, 57.0, 52.0, 70.0, 61.0, 59.0, 53.0, 52.0, 38.0, 33.0, 38.0, 29.0, 22.0, 22.0, 13.0, 11.0, 8.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008541345596313477, -0.000818164087831974, -0.0007821936160326004, -0.0007462231442332268, -0.0007102526724338531, -0.0006742822006344795, -0.0006383117288351059, -0.0006023412570357323, -0.0005663707852363586, -0.000530400313436985, -0.0004944298416376114, -0.00045845936983823776, -0.00042248889803886414, -0.0003865184262394905, -0.0003505479544401169, -0.00031457748264074326, -0.00027860701084136963, -0.000242636539041996, -0.00020666606724262238, -0.00017069559544324875, -0.00013472512364387512, -9.87546518445015e-05, -6.278418004512787e-05, -2.6813708245754242e-05, 9.156763553619385e-06, 4.512723535299301e-05, 8.109770715236664e-05, 0.00011706817895174026, 0.0001530386507511139, 0.00018900912255048752, 0.00022497959434986115, 0.00026095006614923477, 0.0002969205379486084, 0.000332891009747982, 0.00036886148154735565, 0.0004048319533467293, 0.0004408024251461029, 0.00047677289694547653, 0.0005127433687448502, 0.0005487138405442238, 0.0005846843123435974, 0.000620654784142971, 0.0006566252559423447, 0.0006925957277417183, 0.0007285661995410919, 0.0007645366713404655, 0.0008005071431398392, 0.0008364776149392128, 0.0008724480867385864, 0.00090841855853796, 0.0009443890303373337, 0.0009803595021367073, 0.001016329973936081, 0.0010523004457354546, 0.0010882709175348282, 0.0011242413893342018, 0.0011602118611335754, 0.001196182332932949, 0.0012321528047323227, 0.0012681232765316963, 0.00130409374833107, 0.0013400642201304436, 0.0013760346919298172, 0.0014120051637291908, 0.0014479756355285645]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 2.0, 6.0, 1.0, 5.0, 1.0, 8.0, 8.0, 8.0, 13.0, 20.0, 19.0, 18.0, 20.0, 29.0, 33.0, 34.0, 42.0, 34.0, 41.0, 40.0, 43.0, 42.0, 33.0, 49.0, 39.0, 44.0, 42.0, 35.0, 44.0, 26.0, 29.0, 35.0, 18.0, 22.0, 19.0, 17.0, 16.0, 12.0, 11.0, 7.0, 10.0, 5.0, 4.0, 6.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.0078125, -10.6531982421875, -10.298583984375, -9.9439697265625, -9.58935546875, -9.2347412109375, -8.880126953125, -8.5255126953125, -8.1708984375, -7.8162841796875, -7.461669921875, -7.1070556640625, -6.75244140625, -6.3978271484375, -6.043212890625, -5.6885986328125, -5.333984375, -4.9793701171875, -4.624755859375, -4.2701416015625, -3.91552734375, -3.5609130859375, -3.206298828125, -2.8516845703125, -2.4970703125, -2.1424560546875, -1.787841796875, -1.4332275390625, -1.07861328125, -0.7239990234375, -0.369384765625, -0.0147705078125, 0.33984375, 0.6944580078125, 1.049072265625, 1.4036865234375, 1.75830078125, 2.1129150390625, 2.467529296875, 2.8221435546875, 3.1767578125, 3.5313720703125, 3.885986328125, 4.2406005859375, 4.59521484375, 4.9498291015625, 5.304443359375, 5.6590576171875, 6.013671875, 6.3682861328125, 6.722900390625, 7.0775146484375, 7.43212890625, 7.7867431640625, 8.141357421875, 8.4959716796875, 8.8505859375, 9.2052001953125, 9.559814453125, 9.9144287109375, 10.26904296875, 10.6236572265625, 10.978271484375, 11.3328857421875, 11.6875]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 13.0, 24.0, 36.0, 32.0, 62.0, 83.0, 118.0, 162.0, 286.0, 381.0, 584.0, 940.0, 1550.0, 2575.0, 4714.0, 8813.0, 17360.0, 41374.0, 235358.0, 623616.0, 62569.0, 23148.0, 10850.0, 5678.0, 3063.0, 1905.0, 1146.0, 760.0, 433.0, 313.0, 183.0, 122.0, 89.0, 52.0, 57.0, 28.0, 28.0, 5.0, 13.0, 9.0, 11.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.8125, -16.170166015625, -15.52783203125, -14.885498046875, -14.2431640625, -13.600830078125, -12.95849609375, -12.316162109375, -11.673828125, -11.031494140625, -10.38916015625, -9.746826171875, -9.1044921875, -8.462158203125, -7.81982421875, -7.177490234375, -6.53515625, -5.892822265625, -5.25048828125, -4.608154296875, -3.9658203125, -3.323486328125, -2.68115234375, -2.038818359375, -1.396484375, -0.754150390625, -0.11181640625, 0.530517578125, 1.1728515625, 1.815185546875, 2.45751953125, 3.099853515625, 3.7421875, 4.384521484375, 5.02685546875, 5.669189453125, 6.3115234375, 6.953857421875, 7.59619140625, 8.238525390625, 8.880859375, 9.523193359375, 10.16552734375, 10.807861328125, 11.4501953125, 12.092529296875, 12.73486328125, 13.377197265625, 14.01953125, 14.661865234375, 15.30419921875, 15.946533203125, 16.5888671875, 17.231201171875, 17.87353515625, 18.515869140625, 19.158203125, 19.800537109375, 20.44287109375, 21.085205078125, 21.7275390625, 22.369873046875, 23.01220703125, 23.654541015625, 24.296875]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 4.0, 6.0, 2.0, 4.0, 7.0, 7.0, 10.0, 9.0, 18.0, 14.0, 23.0, 24.0, 25.0, 24.0, 34.0, 37.0, 33.0, 45.0, 50.0, 61.0, 85.0, 192.0, 1723.0, 121.0, 81.0, 58.0, 56.0, 44.0, 32.0, 28.0, 26.0, 34.0, 25.0, 16.0, 25.0, 11.0, 5.0, 20.0, 10.0, 9.0, 6.0, 5.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.34375, -31.27734375, -30.2109375, -29.14453125, -28.078125, -27.01171875, -25.9453125, -24.87890625, -23.8125, -22.74609375, -21.6796875, -20.61328125, -19.546875, -18.48046875, -17.4140625, -16.34765625, -15.28125, -14.21484375, -13.1484375, -12.08203125, -11.015625, -9.94921875, -8.8828125, -7.81640625, -6.75, -5.68359375, -4.6171875, -3.55078125, -2.484375, -1.41796875, -0.3515625, 0.71484375, 1.78125, 2.84765625, 3.9140625, 4.98046875, 6.046875, 7.11328125, 8.1796875, 9.24609375, 10.3125, 11.37890625, 12.4453125, 13.51171875, 14.578125, 15.64453125, 16.7109375, 17.77734375, 18.84375, 19.91015625, 20.9765625, 22.04296875, 23.109375, 24.17578125, 25.2421875, 26.30859375, 27.375, 28.44140625, 29.5078125, 30.57421875, 31.640625, 32.70703125, 33.7734375, 34.83984375, 35.90625]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 3.0, 6.0, 6.0, 7.0, 11.0, 13.0, 33.0, 35.0, 35.0, 51.0, 71.0, 93.0, 127.0, 216.0, 364.0, 1078.0, 4535.0, 36465.0, 2971330.0, 119285.0, 8852.0, 1730.0, 544.0, 243.0, 172.0, 103.0, 71.0, 59.0, 38.0, 34.0, 21.0, 20.0, 10.0, 11.0, 14.0, 7.0, 5.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.8125, -64.4833984375, -62.154296875, -59.8251953125, -57.49609375, -55.1669921875, -52.837890625, -50.5087890625, -48.1796875, -45.8505859375, -43.521484375, -41.1923828125, -38.86328125, -36.5341796875, -34.205078125, -31.8759765625, -29.546875, -27.2177734375, -24.888671875, -22.5595703125, -20.23046875, -17.9013671875, -15.572265625, -13.2431640625, -10.9140625, -8.5849609375, -6.255859375, -3.9267578125, -1.59765625, 0.7314453125, 3.060546875, 5.3896484375, 7.71875, 10.0478515625, 12.376953125, 14.7060546875, 17.03515625, 19.3642578125, 21.693359375, 24.0224609375, 26.3515625, 28.6806640625, 31.009765625, 33.3388671875, 35.66796875, 37.9970703125, 40.326171875, 42.6552734375, 44.984375, 47.3134765625, 49.642578125, 51.9716796875, 54.30078125, 56.6298828125, 58.958984375, 61.2880859375, 63.6171875, 65.9462890625, 68.275390625, 70.6044921875, 72.93359375, 75.2626953125, 77.591796875, 79.9208984375, 82.25]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 122.0, 866.0, 27.0], "bins": [-1239.0430908203125, -1219.1612548828125, -1199.279296875, -1179.3974609375, -1159.515625, -1139.6337890625, -1119.7518310546875, -1099.8699951171875, -1079.9881591796875, -1060.1063232421875, -1040.224365234375, -1020.342529296875, -1000.460693359375, -980.5787963867188, -960.6968994140625, -940.8150634765625, -920.93310546875, -901.0512084960938, -881.1693725585938, -861.2874755859375, -841.4056396484375, -821.5237426757812, -801.641845703125, -781.760009765625, -761.878173828125, -741.9962768554688, -722.1144409179688, -702.2325439453125, -682.3507080078125, -662.4688110351562, -642.5869140625, -622.705078125, -602.8231811523438, -582.9412841796875, -563.0594482421875, -543.1775512695312, -523.2957153320312, -503.413818359375, -483.5319519042969, -463.65008544921875, -443.7681884765625, -423.8863220214844, -404.00445556640625, -384.12255859375, -364.2406921386719, -344.35882568359375, -324.4769592285156, -304.5950927734375, -284.71319580078125, -264.8313293457031, -244.94944763183594, -225.0675811767578, -205.18569946289062, -185.3038330078125, -165.42196655273438, -145.5400848388672, -125.65821838378906, -105.7763442993164, -85.89447021484375, -66.01260375976562, -46.13072967529297, -26.248855590820312, -6.3669891357421875, 13.514892578125, 33.39675521850586]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 5.0, 7.0, 6.0, 10.0, 5.0, 6.0, 13.0, 14.0, 18.0, 23.0, 19.0, 21.0, 32.0, 28.0, 34.0, 34.0, 29.0, 35.0, 35.0, 31.0, 45.0, 38.0, 52.0, 36.0, 42.0, 38.0, 41.0, 35.0, 30.0, 29.0, 29.0, 30.0, 24.0, 13.0, 21.0, 12.0, 16.0, 13.0, 16.0, 10.0, 5.0, 5.0, 5.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-78.21829223632812, -75.77754974365234, -73.33680725097656, -70.89607238769531, -68.45532989501953, -66.01458740234375, -63.57384490966797, -61.13310241699219, -58.69236373901367, -56.25162124633789, -53.810882568359375, -51.370140075683594, -48.92939758300781, -46.4886589050293, -44.047916412353516, -41.607177734375, -39.16643524169922, -36.72569274902344, -34.28495407104492, -31.84421157836914, -29.403470993041992, -26.962730407714844, -24.521987915039062, -22.081247329711914, -19.640506744384766, -17.199766159057617, -14.759024620056152, -12.318283081054688, -9.877542495727539, -7.436801910400391, -4.996060371398926, -2.555318832397461, -0.11458587646484375, 2.326155185699463, 4.7668962478637695, 7.207637310028076, 9.648378372192383, 12.089118957519531, 14.529860496520996, 16.97060203552246, 19.41134262084961, 21.852083206176758, 24.292823791503906, 26.733566284179688, 29.174306869506836, 31.615047454833984, 34.055789947509766, 36.49652862548828, 38.93727111816406, 41.378013610839844, 43.81875228881836, 46.25949478149414, 48.700233459472656, 51.14097595214844, 53.58171844482422, 56.0224609375, 58.463199615478516, 60.9039421081543, 63.34468078613281, 65.7854232788086, 68.22616577148438, 70.66690063476562, 73.1076431274414, 75.54838562011719, 77.98912811279297]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 3.0, 4.0, 3.0, 6.0, 7.0, 10.0, 9.0, 14.0, 9.0, 14.0, 19.0, 23.0, 31.0, 28.0, 34.0, 26.0, 38.0, 33.0, 30.0, 40.0, 40.0, 41.0, 31.0, 34.0, 35.0, 44.0, 38.0, 38.0, 31.0, 35.0, 32.0, 29.0, 25.0, 23.0, 26.0, 17.0, 12.0, 7.0, 17.0, 8.0, 9.0, 9.0, 5.0, 10.0, 2.0, 4.0, 2.0, 1.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0], "bins": [-11.2421875, -10.89111328125, -10.5400390625, -10.18896484375, -9.837890625, -9.48681640625, -9.1357421875, -8.78466796875, -8.43359375, -8.08251953125, -7.7314453125, -7.38037109375, -7.029296875, -6.67822265625, -6.3271484375, -5.97607421875, -5.625, -5.27392578125, -4.9228515625, -4.57177734375, -4.220703125, -3.86962890625, -3.5185546875, -3.16748046875, -2.81640625, -2.46533203125, -2.1142578125, -1.76318359375, -1.412109375, -1.06103515625, -0.7099609375, -0.35888671875, -0.0078125, 0.34326171875, 0.6943359375, 1.04541015625, 1.396484375, 1.74755859375, 2.0986328125, 2.44970703125, 2.80078125, 3.15185546875, 3.5029296875, 3.85400390625, 4.205078125, 4.55615234375, 4.9072265625, 5.25830078125, 5.609375, 5.96044921875, 6.3115234375, 6.66259765625, 7.013671875, 7.36474609375, 7.7158203125, 8.06689453125, 8.41796875, 8.76904296875, 9.1201171875, 9.47119140625, 9.822265625, 10.17333984375, 10.5244140625, 10.87548828125, 11.2265625]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 4.0, 5.0, 8.0, 8.0, 12.0, 14.0, 18.0, 19.0, 20.0, 26.0, 46.0, 70.0, 124.0, 200.0, 383.0, 794.0, 2090.0, 6047.0, 21449.0, 234319.0, 3529361.0, 362935.0, 25184.0, 6684.0, 2394.0, 986.0, 445.0, 224.0, 110.0, 77.0, 53.0, 41.0, 19.0, 27.0, 15.0, 11.0, 8.0, 10.0, 11.0, 3.0, 5.0, 3.0, 5.0, 3.0, 2.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.5, -38.16357421875, -36.8271484375, -35.49072265625, -34.154296875, -32.81787109375, -31.4814453125, -30.14501953125, -28.80859375, -27.47216796875, -26.1357421875, -24.79931640625, -23.462890625, -22.12646484375, -20.7900390625, -19.45361328125, -18.1171875, -16.78076171875, -15.4443359375, -14.10791015625, -12.771484375, -11.43505859375, -10.0986328125, -8.76220703125, -7.42578125, -6.08935546875, -4.7529296875, -3.41650390625, -2.080078125, -0.74365234375, 0.5927734375, 1.92919921875, 3.265625, 4.60205078125, 5.9384765625, 7.27490234375, 8.611328125, 9.94775390625, 11.2841796875, 12.62060546875, 13.95703125, 15.29345703125, 16.6298828125, 17.96630859375, 19.302734375, 20.63916015625, 21.9755859375, 23.31201171875, 24.6484375, 25.98486328125, 27.3212890625, 28.65771484375, 29.994140625, 31.33056640625, 32.6669921875, 34.00341796875, 35.33984375, 36.67626953125, 38.0126953125, 39.34912109375, 40.685546875, 42.02197265625, 43.3583984375, 44.69482421875, 46.03125]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 7.0, 9.0, 13.0, 10.0, 16.0, 17.0, 24.0, 42.0, 43.0, 59.0, 70.0, 121.0, 205.0, 390.0, 726.0, 872.0, 573.0, 323.0, 185.0, 109.0, 71.0, 63.0, 28.0, 37.0, 11.0, 7.0, 9.0, 8.0, 3.0, 8.0, 4.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-32.28125, -31.438720703125, -30.59619140625, -29.753662109375, -28.9111328125, -28.068603515625, -27.22607421875, -26.383544921875, -25.541015625, -24.698486328125, -23.85595703125, -23.013427734375, -22.1708984375, -21.328369140625, -20.48583984375, -19.643310546875, -18.80078125, -17.958251953125, -17.11572265625, -16.273193359375, -15.4306640625, -14.588134765625, -13.74560546875, -12.903076171875, -12.060546875, -11.218017578125, -10.37548828125, -9.532958984375, -8.6904296875, -7.847900390625, -7.00537109375, -6.162841796875, -5.3203125, -4.477783203125, -3.63525390625, -2.792724609375, -1.9501953125, -1.107666015625, -0.26513671875, 0.577392578125, 1.419921875, 2.262451171875, 3.10498046875, 3.947509765625, 4.7900390625, 5.632568359375, 6.47509765625, 7.317626953125, 8.16015625, 9.002685546875, 9.84521484375, 10.687744140625, 11.5302734375, 12.372802734375, 13.21533203125, 14.057861328125, 14.900390625, 15.742919921875, 16.58544921875, 17.427978515625, 18.2705078125, 19.113037109375, 19.95556640625, 20.798095703125, 21.640625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 5.0, 4.0, 6.0, 6.0, 7.0, 8.0, 2.0, 9.0, 15.0, 33.0, 36.0, 54.0, 76.0, 142.0, 292.0, 1007.0, 22037.0, 4091031.0, 76887.0, 1793.0, 362.0, 147.0, 82.0, 62.0, 42.0, 38.0, 24.0, 21.0, 12.0, 11.0, 15.0, 7.0, 6.0, 3.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-130.25, -125.359375, -120.46875, -115.578125, -110.6875, -105.796875, -100.90625, -96.015625, -91.125, -86.234375, -81.34375, -76.453125, -71.5625, -66.671875, -61.78125, -56.890625, -52.0, -47.109375, -42.21875, -37.328125, -32.4375, -27.546875, -22.65625, -17.765625, -12.875, -7.984375, -3.09375, 1.796875, 6.6875, 11.578125, 16.46875, 21.359375, 26.25, 31.140625, 36.03125, 40.921875, 45.8125, 50.703125, 55.59375, 60.484375, 65.375, 70.265625, 75.15625, 80.046875, 84.9375, 89.828125, 94.71875, 99.609375, 104.5, 109.390625, 114.28125, 119.171875, 124.0625, 128.953125, 133.84375, 138.734375, 143.625, 148.515625, 153.40625, 158.296875, 163.1875, 168.078125, 172.96875, 177.859375, 182.75]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 15.0, 39.0, 62.0, 133.0, 234.0, 234.0, 154.0, 82.0, 32.0, 11.0, 7.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-260.8446960449219, -255.1780548095703, -249.51141357421875, -243.8447723388672, -238.17813110351562, -232.51148986816406, -226.8448486328125, -221.17822265625, -215.51156616210938, -209.8449249267578, -204.17828369140625, -198.5116424560547, -192.84500122070312, -187.17835998535156, -181.51171875, -175.8450927734375, -170.17845153808594, -164.51181030273438, -158.8451690673828, -153.17852783203125, -147.5118865966797, -141.84524536132812, -136.17861938476562, -130.511962890625, -124.84532928466797, -119.1786880493164, -113.51204681396484, -107.84541320800781, -102.17877197265625, -96.51213073730469, -90.84548950195312, -85.17884826660156, -79.51219177246094, -73.84555053710938, -68.17890930175781, -62.512271881103516, -56.84563064575195, -51.17898941040039, -45.512351989746094, -39.84571075439453, -34.17906951904297, -28.512428283691406, -22.845788955688477, -17.179149627685547, -11.512508392333984, -5.845867156982422, -0.179229736328125, 5.4874114990234375, 11.154052734375, 16.820693969726562, 22.487333297729492, 28.153972625732422, 33.820613861083984, 39.48725509643555, 45.153892517089844, 50.820533752441406, 56.48717498779297, 62.15381622314453, 67.8204574584961, 73.48709106445312, 79.15373229980469, 84.82037353515625, 90.48701477050781, 96.15365600585938, 101.82029724121094]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 6.0, 7.0, 8.0, 7.0, 7.0, 19.0, 17.0, 12.0, 21.0, 17.0, 25.0, 18.0, 24.0, 31.0, 35.0, 38.0, 39.0, 25.0, 31.0, 41.0, 36.0, 37.0, 41.0, 38.0, 38.0, 36.0, 34.0, 50.0, 34.0, 24.0, 33.0, 27.0, 28.0, 20.0, 19.0, 12.0, 17.0, 10.0, 5.0, 9.0, 8.0, 6.0, 3.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-68.22395324707031, -66.15882110595703, -64.09368133544922, -62.02854919433594, -59.96341323852539, -57.898277282714844, -55.8331413269043, -53.76800537109375, -51.70287322998047, -49.63773727416992, -47.572601318359375, -45.507469177246094, -43.44233322143555, -41.377197265625, -39.31206130981445, -37.246925354003906, -35.18178939819336, -33.11665344238281, -31.0515193939209, -28.98638343811035, -26.921249389648438, -24.85611343383789, -22.790977478027344, -20.725841522216797, -18.660707473754883, -16.595571517944336, -14.530437469482422, -12.465301513671875, -10.400166511535645, -8.335031509399414, -6.269895553588867, -4.204760551452637, -2.1396255493164062, -0.07449030876159668, 1.990644931793213, 4.055780410766602, 6.120915412902832, 8.186050415039062, 10.25118637084961, 12.31632137298584, 14.38145637512207, 16.446592330932617, 18.51172637939453, 20.576862335205078, 22.641998291015625, 24.70713233947754, 26.772268295288086, 28.83740234375, 30.902538299560547, 32.967674255371094, 35.03281021118164, 37.09794616699219, 39.16307830810547, 41.228214263916016, 43.29335021972656, 45.35848617553711, 47.423622131347656, 49.4887580871582, 51.55389404296875, 53.61902618408203, 55.68416213989258, 57.749298095703125, 59.81443405151367, 61.87957000732422, 63.9447021484375]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 1.0, 6.0, 6.0, 3.0, 9.0, 13.0, 12.0, 21.0, 19.0, 21.0, 25.0, 27.0, 25.0, 39.0, 28.0, 35.0, 41.0, 27.0, 26.0, 38.0, 48.0, 45.0, 52.0, 49.0, 38.0, 41.0, 34.0, 35.0, 36.0, 19.0, 29.0, 23.0, 16.0, 23.0, 11.0, 19.0, 18.0, 8.0, 8.0, 8.0, 4.0, 4.0, 1.0, 4.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.78125, -10.4022216796875, -10.023193359375, -9.6441650390625, -9.26513671875, -8.8861083984375, -8.507080078125, -8.1280517578125, -7.7490234375, -7.3699951171875, -6.990966796875, -6.6119384765625, -6.23291015625, -5.8538818359375, -5.474853515625, -5.0958251953125, -4.716796875, -4.3377685546875, -3.958740234375, -3.5797119140625, -3.20068359375, -2.8216552734375, -2.442626953125, -2.0635986328125, -1.6845703125, -1.3055419921875, -0.926513671875, -0.5474853515625, -0.16845703125, 0.2105712890625, 0.589599609375, 0.9686279296875, 1.34765625, 1.7266845703125, 2.105712890625, 2.4847412109375, 2.86376953125, 3.2427978515625, 3.621826171875, 4.0008544921875, 4.3798828125, 4.7589111328125, 5.137939453125, 5.5169677734375, 5.89599609375, 6.2750244140625, 6.654052734375, 7.0330810546875, 7.412109375, 7.7911376953125, 8.170166015625, 8.5491943359375, 8.92822265625, 9.3072509765625, 9.686279296875, 10.0653076171875, 10.4443359375, 10.8233642578125, 11.202392578125, 11.5814208984375, 11.96044921875, 12.3394775390625, 12.718505859375, 13.0975341796875, 13.4765625]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 6.0, 13.0, 22.0, 25.0, 39.0, 62.0, 89.0, 139.0, 243.0, 269.0, 428.0, 691.0, 1003.0, 1454.0, 2269.0, 3409.0, 5156.0, 7910.0, 12275.0, 19321.0, 30183.0, 48509.0, 77044.0, 120369.0, 187091.0, 191843.0, 123560.0, 78273.0, 49288.0, 31043.0, 19817.0, 12621.0, 8215.0, 5449.0, 3404.0, 2350.0, 1565.0, 1011.0, 704.0, 469.0, 307.0, 198.0, 134.0, 91.0, 56.0, 41.0, 32.0, 25.0, 15.0, 2.0, 10.0, 7.0, 3.0, 3.0, 1.0, 1.0], "bins": [-0.270751953125, -0.2625541687011719, -0.25435638427734375, -0.24615859985351562, -0.2379608154296875, -0.22976303100585938, -0.22156524658203125, -0.21336746215820312, -0.205169677734375, -0.19697189331054688, -0.18877410888671875, -0.18057632446289062, -0.1723785400390625, -0.16418075561523438, -0.15598297119140625, -0.14778518676757812, -0.13958740234375, -0.13138961791992188, -0.12319183349609375, -0.11499404907226562, -0.1067962646484375, -0.09859848022460938, -0.09040069580078125, -0.08220291137695312, -0.074005126953125, -0.06580734252929688, -0.05760955810546875, -0.049411773681640625, -0.0412139892578125, -0.033016204833984375, -0.02481842041015625, -0.016620635986328125, -0.0084228515625, -0.000225067138671875, 0.00797271728515625, 0.016170501708984375, 0.0243682861328125, 0.032566070556640625, 0.04076385498046875, 0.048961639404296875, 0.057159423828125, 0.06535720825195312, 0.07355499267578125, 0.08175277709960938, 0.0899505615234375, 0.09814834594726562, 0.10634613037109375, 0.11454391479492188, 0.12274169921875, 0.13093948364257812, 0.13913726806640625, 0.14733505249023438, 0.1555328369140625, 0.16373062133789062, 0.17192840576171875, 0.18012619018554688, 0.188323974609375, 0.19652175903320312, 0.20471954345703125, 0.21291732788085938, 0.2211151123046875, 0.22931289672851562, 0.23751068115234375, 0.24570846557617188, 0.25390625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 6.0, 5.0, 4.0, 6.0, 4.0, 12.0, 15.0, 14.0, 15.0, 27.0, 15.0, 15.0, 20.0, 18.0, 29.0, 27.0, 28.0, 33.0, 26.0, 33.0, 49.0, 35.0, 38.0, 1068.0, 42.0, 35.0, 37.0, 35.0, 39.0, 38.0, 35.0, 19.0, 21.0, 28.0, 26.0, 21.0, 15.0, 15.0, 13.0, 18.0, 10.0, 9.0, 8.0, 5.0, 10.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.9609375, -7.701904296875, -7.44287109375, -7.183837890625, -6.9248046875, -6.665771484375, -6.40673828125, -6.147705078125, -5.888671875, -5.629638671875, -5.37060546875, -5.111572265625, -4.8525390625, -4.593505859375, -4.33447265625, -4.075439453125, -3.81640625, -3.557373046875, -3.29833984375, -3.039306640625, -2.7802734375, -2.521240234375, -2.26220703125, -2.003173828125, -1.744140625, -1.485107421875, -1.22607421875, -0.967041015625, -0.7080078125, -0.448974609375, -0.18994140625, 0.069091796875, 0.328125, 0.587158203125, 0.84619140625, 1.105224609375, 1.3642578125, 1.623291015625, 1.88232421875, 2.141357421875, 2.400390625, 2.659423828125, 2.91845703125, 3.177490234375, 3.4365234375, 3.695556640625, 3.95458984375, 4.213623046875, 4.47265625, 4.731689453125, 4.99072265625, 5.249755859375, 5.5087890625, 5.767822265625, 6.02685546875, 6.285888671875, 6.544921875, 6.803955078125, 7.06298828125, 7.322021484375, 7.5810546875, 7.840087890625, 8.09912109375, 8.358154296875, 8.6171875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 6.0, 7.0, 11.0, 11.0, 19.0, 23.0, 38.0, 57.0, 92.0, 115.0, 174.0, 254.0, 324.0, 432.0, 681.0, 977.0, 1270.0, 1721.0, 2336.0, 3249.0, 4757.0, 6824.0, 9663.0, 13874.0, 20319.0, 29646.0, 44018.0, 67707.0, 106036.0, 172016.0, 1244791.0, 125251.0, 78771.0, 50890.0, 34106.0, 22939.0, 15990.0, 11174.0, 7684.0, 5576.0, 3761.0, 2725.0, 1924.0, 1426.0, 1023.0, 732.0, 494.0, 372.0, 240.0, 200.0, 129.0, 100.0, 58.0, 47.0, 34.0, 26.0, 9.0, 7.0, 5.0, 2.0, 4.0, 3.0, 1.0], "bins": [-0.11517333984375, -0.11147880554199219, -0.10778427124023438, -0.10408973693847656, -0.10039520263671875, -0.09670066833496094, -0.09300613403320312, -0.08931159973144531, -0.0856170654296875, -0.08192253112792969, -0.07822799682617188, -0.07453346252441406, -0.07083892822265625, -0.06714439392089844, -0.06344985961914062, -0.05975532531738281, -0.056060791015625, -0.05236625671386719, -0.048671722412109375, -0.04497718811035156, -0.04128265380859375, -0.03758811950683594, -0.033893585205078125, -0.030199050903320312, -0.0265045166015625, -0.022809982299804688, -0.019115447998046875, -0.015420913696289062, -0.01172637939453125, -0.008031845092773438, -0.004337310791015625, -0.0006427764892578125, 0.0030517578125, 0.0067462921142578125, 0.010440826416015625, 0.014135360717773438, 0.01782989501953125, 0.021524429321289062, 0.025218963623046875, 0.028913497924804688, 0.0326080322265625, 0.03630256652832031, 0.039997100830078125, 0.04369163513183594, 0.04738616943359375, 0.05108070373535156, 0.054775238037109375, 0.05846977233886719, 0.062164306640625, 0.06585884094238281, 0.06955337524414062, 0.07324790954589844, 0.07694244384765625, 0.08063697814941406, 0.08433151245117188, 0.08802604675292969, 0.0917205810546875, 0.09541511535644531, 0.09910964965820312, 0.10280418395996094, 0.10649871826171875, 0.11019325256347656, 0.11388778686523438, 0.11758232116699219, 0.12127685546875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 2.0, 1.0, 5.0, 3.0, 5.0, 5.0, 7.0, 8.0, 7.0, 11.0, 12.0, 12.0, 15.0, 29.0, 32.0, 28.0, 39.0, 41.0, 46.0, 56.0, 61.0, 62.0, 53.0, 67.0, 65.0, 59.0, 40.0, 44.0, 24.0, 28.0, 21.0, 18.0, 15.0, 11.0, 4.0, 9.0, 17.0, 3.0, 7.0, 1.0, 7.0, 2.0, 6.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.0006089210510253906, -0.0005890354514122009, -0.0005691498517990112, -0.0005492642521858215, -0.0005293786525726318, -0.0005094930529594421, -0.0004896074533462524, -0.00046972185373306274, -0.00044983625411987305, -0.00042995065450668335, -0.00041006505489349365, -0.00039017945528030396, -0.00037029385566711426, -0.00035040825605392456, -0.00033052265644073486, -0.00031063705682754517, -0.00029075145721435547, -0.00027086585760116577, -0.0002509802579879761, -0.00023109465837478638, -0.00021120905876159668, -0.00019132345914840698, -0.00017143785953521729, -0.0001515522599220276, -0.0001316666603088379, -0.0001117810606956482, -9.18954610824585e-05, -7.20098614692688e-05, -5.21242618560791e-05, -3.2238662242889404e-05, -1.2353062629699707e-05, 7.53253698348999e-06, 2.7418136596679688e-05, 4.7303736209869385e-05, 6.718933582305908e-05, 8.707493543624878e-05, 0.00010696053504943848, 0.00012684613466262817, 0.00014673173427581787, 0.00016661733388900757, 0.00018650293350219727, 0.00020638853311538696, 0.00022627413272857666, 0.00024615973234176636, 0.00026604533195495605, 0.00028593093156814575, 0.00030581653118133545, 0.00032570213079452515, 0.00034558773040771484, 0.00036547333002090454, 0.00038535892963409424, 0.00040524452924728394, 0.00042513012886047363, 0.00044501572847366333, 0.00046490132808685303, 0.0004847869277000427, 0.0005046725273132324, 0.0005245581269264221, 0.0005444437265396118, 0.0005643293261528015, 0.0005842149257659912, 0.0006041005253791809, 0.0006239861249923706, 0.0006438717246055603, 0.00066375732421875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 4.0, 2.0, 7.0, 2.0, 4.0, 3.0, 19.0, 9.0, 4.0, 11.0, 14.0, 19.0, 26.0, 29.0, 36.0, 56.0, 69.0, 125.0, 234.0, 660.0, 17312.0, 1021426.0, 7418.0, 494.0, 185.0, 93.0, 58.0, 43.0, 46.0, 34.0, 18.0, 11.0, 11.0, 12.0, 8.0, 10.0, 6.0, 4.0, 4.0, 5.0, 4.0, 2.0, 1.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0], "bins": [-0.015869140625, -0.015394210815429688, -0.014919281005859375, -0.014444351196289062, -0.01396942138671875, -0.013494491577148438, -0.013019561767578125, -0.012544631958007812, -0.0120697021484375, -0.011594772338867188, -0.011119842529296875, -0.010644912719726562, -0.01016998291015625, -0.009695053100585938, -0.009220123291015625, -0.008745193481445312, -0.008270263671875, -0.0077953338623046875, -0.007320404052734375, -0.0068454742431640625, -0.00637054443359375, -0.0058956146240234375, -0.005420684814453125, -0.0049457550048828125, -0.0044708251953125, -0.0039958953857421875, -0.003520965576171875, -0.0030460357666015625, -0.00257110595703125, -0.0020961761474609375, -0.001621246337890625, -0.0011463165283203125, -0.00067138671875, -0.0001964569091796875, 0.000278472900390625, 0.0007534027099609375, 0.00122833251953125, 0.0017032623291015625, 0.002178192138671875, 0.0026531219482421875, 0.0031280517578125, 0.0036029815673828125, 0.004077911376953125, 0.0045528411865234375, 0.00502777099609375, 0.0055027008056640625, 0.005977630615234375, 0.0064525604248046875, 0.006927490234375, 0.0074024200439453125, 0.007877349853515625, 0.008352279663085938, 0.00882720947265625, 0.009302139282226562, 0.009777069091796875, 0.010251998901367188, 0.0107269287109375, 0.011201858520507812, 0.011676788330078125, 0.012151718139648438, 0.01262664794921875, 0.013101577758789062, 0.013576507568359375, 0.014051437377929688, 0.0145263671875]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 31.0, 982.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.026336494833230972, -0.025868872180581093, -0.025401249527931213, -0.024933626875281334, -0.024466004222631454, -0.023998383432626724, -0.023530758917331696, -0.023063138127326965, -0.022595515474677086, -0.022127892822027206, -0.021660270169377327, -0.021192647516727448, -0.020725024864077568, -0.02025740221142769, -0.01978978142142296, -0.01932215876877308, -0.0188545361161232, -0.01838691346347332, -0.01791929081082344, -0.01745166815817356, -0.01698404550552368, -0.01651642471551895, -0.016048800200223923, -0.015581178478896618, -0.015113554894924164, -0.014645932242274284, -0.014178309589624405, -0.013710686936974525, -0.01324306521564722, -0.012775442562997341, -0.012307819910347462, -0.011840197257697582, -0.011372575536370277, -0.010904952883720398, -0.010437330231070518, -0.009969707578420639, -0.009502085857093334, -0.009034463204443455, -0.008566840551793575, -0.008099217899143696, -0.007631596177816391, -0.0071639735251665115, -0.006696351338177919, -0.00622872868552804, -0.005761106498539448, -0.005293483845889568, -0.004825861193239689, -0.004358238540589809, -0.0038906161207705736, -0.003422993700951338, -0.0029553710483014584, -0.0024877486284822226, -0.0020201262086629868, -0.001552503788843751, -0.0010848811361938715, -0.0006172587163746357, -0.0001496362965553999, 0.0003179861814714968, 0.0007856086594983935, 0.0012532311957329512, 0.001720853615552187, 0.0021884760353714228, 0.0026560986880213022, 0.003123721107840538, 0.003591343527659774]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 5.0, 10.0, 11.0, 18.0, 15.0, 23.0, 34.0, 52.0, 49.0, 55.0, 49.0, 71.0, 72.0, 79.0, 77.0, 70.0, 58.0, 49.0, 39.0, 45.0, 35.0, 24.0, 18.0, 16.0, 9.0, 4.0, 5.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008350610733032227, -0.0008047772571444511, -0.0007744934409856796, -0.0007442096248269081, -0.0007139258086681366, -0.0006836419925093651, -0.0006533581763505936, -0.000623074360191822, -0.0005927905440330505, -0.000562506727874279, -0.0005322229117155075, -0.000501939095556736, -0.0004716552793979645, -0.00044137146323919296, -0.00041108764708042145, -0.00038080383092164993, -0.0003505200147628784, -0.0003202361986041069, -0.0002899523824453354, -0.0002596685662865639, -0.00022938475012779236, -0.00019910093396902084, -0.00016881711781024933, -0.00013853330165147781, -0.0001082494854927063, -7.796566933393478e-05, -4.768185317516327e-05, -1.7398037016391754e-05, 1.288577914237976e-05, 4.3169595301151276e-05, 7.345341145992279e-05, 0.0001037372276186943, 0.00013402104377746582, 0.00016430485993623734, 0.00019458867609500885, 0.00022487249225378036, 0.0002551563084125519, 0.0002854401245713234, 0.0003157239407300949, 0.0003460077568888664, 0.00037629157304763794, 0.00040657538920640945, 0.00043685920536518097, 0.0004671430215239525, 0.000497426837682724, 0.0005277106538414955, 0.000557994470000267, 0.0005882782861590385, 0.0006185621023178101, 0.0006488459184765816, 0.0006791297346353531, 0.0007094135507941246, 0.0007396973669528961, 0.0007699811831116676, 0.0008002649992704391, 0.0008305488154292107, 0.0008608326315879822, 0.0008911164477467537, 0.0009214002639055252, 0.0009516840800642967, 0.0009819678962230682, 0.0010122517123818398, 0.0010425355285406113, 0.0010728193446993828, 0.0011031031608581543]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 1.0, 6.0, 6.0, 3.0, 9.0, 13.0, 12.0, 21.0, 19.0, 21.0, 25.0, 27.0, 25.0, 39.0, 28.0, 35.0, 41.0, 27.0, 26.0, 38.0, 48.0, 45.0, 52.0, 49.0, 38.0, 41.0, 34.0, 35.0, 36.0, 19.0, 29.0, 23.0, 16.0, 23.0, 11.0, 19.0, 18.0, 8.0, 8.0, 8.0, 4.0, 4.0, 1.0, 4.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.78125, -10.4022216796875, -10.023193359375, -9.6441650390625, -9.26513671875, -8.8861083984375, -8.507080078125, -8.1280517578125, -7.7490234375, -7.3699951171875, -6.990966796875, -6.6119384765625, -6.23291015625, -5.8538818359375, -5.474853515625, -5.0958251953125, -4.716796875, -4.3377685546875, -3.958740234375, -3.5797119140625, -3.20068359375, -2.8216552734375, -2.442626953125, -2.0635986328125, -1.6845703125, -1.3055419921875, -0.926513671875, -0.5474853515625, -0.16845703125, 0.2105712890625, 0.589599609375, 0.9686279296875, 1.34765625, 1.7266845703125, 2.105712890625, 2.4847412109375, 2.86376953125, 3.2427978515625, 3.621826171875, 4.0008544921875, 4.3798828125, 4.7589111328125, 5.137939453125, 5.5169677734375, 5.89599609375, 6.2750244140625, 6.654052734375, 7.0330810546875, 7.412109375, 7.7911376953125, 8.170166015625, 8.5491943359375, 8.92822265625, 9.3072509765625, 9.686279296875, 10.0653076171875, 10.4443359375, 10.8233642578125, 11.202392578125, 11.5814208984375, 11.96044921875, 12.3394775390625, 12.718505859375, 13.0975341796875, 13.4765625]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 4.0, 9.0, 5.0, 12.0, 14.0, 19.0, 23.0, 44.0, 65.0, 88.0, 115.0, 177.0, 276.0, 396.0, 575.0, 926.0, 1383.0, 2385.0, 4006.0, 7459.0, 15303.0, 41789.0, 288605.0, 585906.0, 59489.0, 18574.0, 8836.0, 4786.0, 2726.0, 1656.0, 983.0, 597.0, 409.0, 269.0, 198.0, 131.0, 113.0, 62.0, 32.0, 39.0, 28.0, 14.0, 10.0, 6.0, 3.0, 10.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.1953125, -13.7078857421875, -13.220458984375, -12.7330322265625, -12.24560546875, -11.7581787109375, -11.270751953125, -10.7833251953125, -10.2958984375, -9.8084716796875, -9.321044921875, -8.8336181640625, -8.34619140625, -7.8587646484375, -7.371337890625, -6.8839111328125, -6.396484375, -5.9090576171875, -5.421630859375, -4.9342041015625, -4.44677734375, -3.9593505859375, -3.471923828125, -2.9844970703125, -2.4970703125, -2.0096435546875, -1.522216796875, -1.0347900390625, -0.54736328125, -0.0599365234375, 0.427490234375, 0.9149169921875, 1.40234375, 1.8897705078125, 2.377197265625, 2.8646240234375, 3.35205078125, 3.8394775390625, 4.326904296875, 4.8143310546875, 5.3017578125, 5.7891845703125, 6.276611328125, 6.7640380859375, 7.25146484375, 7.7388916015625, 8.226318359375, 8.7137451171875, 9.201171875, 9.6885986328125, 10.176025390625, 10.6634521484375, 11.15087890625, 11.6383056640625, 12.125732421875, 12.6131591796875, 13.1005859375, 13.5880126953125, 14.075439453125, 14.5628662109375, 15.05029296875, 15.5377197265625, 16.025146484375, 16.5125732421875, 17.0]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 5.0, 9.0, 10.0, 8.0, 11.0, 15.0, 22.0, 19.0, 18.0, 29.0, 37.0, 33.0, 30.0, 39.0, 45.0, 54.0, 82.0, 171.0, 1812.0, 114.0, 86.0, 55.0, 44.0, 41.0, 41.0, 31.0, 40.0, 26.0, 33.0, 17.0, 14.0, 10.0, 10.0, 7.0, 6.0, 4.0, 7.0, 4.0, 2.0, 5.0, 3.0, 0.0, 5.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-40.375, -39.12646484375, -37.8779296875, -36.62939453125, -35.380859375, -34.13232421875, -32.8837890625, -31.63525390625, -30.38671875, -29.13818359375, -27.8896484375, -26.64111328125, -25.392578125, -24.14404296875, -22.8955078125, -21.64697265625, -20.3984375, -19.14990234375, -17.9013671875, -16.65283203125, -15.404296875, -14.15576171875, -12.9072265625, -11.65869140625, -10.41015625, -9.16162109375, -7.9130859375, -6.66455078125, -5.416015625, -4.16748046875, -2.9189453125, -1.67041015625, -0.421875, 0.82666015625, 2.0751953125, 3.32373046875, 4.572265625, 5.82080078125, 7.0693359375, 8.31787109375, 9.56640625, 10.81494140625, 12.0634765625, 13.31201171875, 14.560546875, 15.80908203125, 17.0576171875, 18.30615234375, 19.5546875, 20.80322265625, 22.0517578125, 23.30029296875, 24.548828125, 25.79736328125, 27.0458984375, 28.29443359375, 29.54296875, 30.79150390625, 32.0400390625, 33.28857421875, 34.537109375, 35.78564453125, 37.0341796875, 38.28271484375, 39.53125]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 4.0, 3.0, 1.0, 7.0, 7.0, 5.0, 6.0, 6.0, 13.0, 14.0, 17.0, 27.0, 36.0, 46.0, 48.0, 71.0, 95.0, 136.0, 340.0, 1119.0, 10193.0, 2881240.0, 245333.0, 5405.0, 832.0, 221.0, 128.0, 70.0, 54.0, 51.0, 35.0, 33.0, 26.0, 22.0, 13.0, 11.0, 9.0, 6.0, 13.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-91.125, -88.2666015625, -85.408203125, -82.5498046875, -79.69140625, -76.8330078125, -73.974609375, -71.1162109375, -68.2578125, -65.3994140625, -62.541015625, -59.6826171875, -56.82421875, -53.9658203125, -51.107421875, -48.2490234375, -45.390625, -42.5322265625, -39.673828125, -36.8154296875, -33.95703125, -31.0986328125, -28.240234375, -25.3818359375, -22.5234375, -19.6650390625, -16.806640625, -13.9482421875, -11.08984375, -8.2314453125, -5.373046875, -2.5146484375, 0.34375, 3.2021484375, 6.060546875, 8.9189453125, 11.77734375, 14.6357421875, 17.494140625, 20.3525390625, 23.2109375, 26.0693359375, 28.927734375, 31.7861328125, 34.64453125, 37.5029296875, 40.361328125, 43.2197265625, 46.078125, 48.9365234375, 51.794921875, 54.6533203125, 57.51171875, 60.3701171875, 63.228515625, 66.0869140625, 68.9453125, 71.8037109375, 74.662109375, 77.5205078125, 80.37890625, 83.2373046875, 86.095703125, 88.9541015625, 91.8125]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 16.0, 193.0, 543.0, 232.0, 24.0, 5.0, 0.0, 2.0], "bins": [-378.1009826660156, -371.63995361328125, -365.17889404296875, -358.7178649902344, -352.2568054199219, -345.7957763671875, -339.334716796875, -332.8736877441406, -326.41265869140625, -319.9516296386719, -313.4905700683594, -307.029541015625, -300.5684814453125, -294.1074523925781, -287.64642333984375, -281.18536376953125, -274.72430419921875, -268.2632751464844, -261.8022155761719, -255.3411865234375, -248.88014221191406, -242.41909790039062, -235.9580535888672, -229.49700927734375, -223.03598022460938, -216.57493591308594, -210.1138916015625, -203.65286254882812, -197.1918182373047, -190.73077392578125, -184.2697296142578, -177.80868530273438, -171.34765625, -164.88661193847656, -158.42556762695312, -151.96453857421875, -145.5034942626953, -139.04244995117188, -132.58140563964844, -126.120361328125, -119.65933227539062, -113.19828796386719, -106.73725128173828, -100.27620697021484, -93.81517028808594, -87.3541259765625, -80.89308166503906, -74.43203735351562, -67.97099304199219, -61.509952545166016, -55.048912048339844, -48.587867736816406, -42.126827239990234, -35.66578674316406, -29.204742431640625, -22.743701934814453, -16.282665252685547, -9.821623802185059, -3.3605823516845703, 3.1004600524902344, 9.561500549316406, 16.022541046142578, 22.483585357666016, 28.944625854492188, 35.40566635131836]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 2.0, 3.0, 4.0, 5.0, 11.0, 11.0, 7.0, 19.0, 15.0, 14.0, 22.0, 25.0, 24.0, 27.0, 26.0, 25.0, 32.0, 29.0, 38.0, 34.0, 39.0, 33.0, 40.0, 45.0, 38.0, 45.0, 38.0, 32.0, 26.0, 29.0, 25.0, 24.0, 24.0, 18.0, 23.0, 22.0, 16.0, 24.0, 16.0, 8.0, 15.0, 8.0, 5.0, 4.0, 10.0, 3.0, 6.0, 5.0, 0.0, 1.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-84.20744323730469, -81.36939239501953, -78.53133392333984, -75.69328308105469, -72.855224609375, -70.01717376708984, -67.17912292480469, -64.341064453125, -61.503013610839844, -58.66495895385742, -55.826904296875, -52.988853454589844, -50.15079879760742, -47.312744140625, -44.474693298339844, -41.63663864135742, -38.798583984375, -35.96052932739258, -33.122474670410156, -30.284423828125, -27.446369171142578, -24.608314514160156, -21.770261764526367, -18.932209014892578, -16.094154357910156, -13.25610065460205, -10.418046951293945, -7.57999324798584, -4.741939544677734, -1.903885841369629, 0.9341678619384766, 3.7722206115722656, 6.6102752685546875, 9.448328971862793, 12.286382675170898, 15.124436378479004, 17.96249008178711, 20.80054473876953, 23.63859748840332, 26.47665023803711, 29.31470489501953, 32.15275955200195, 34.990814208984375, 37.82886505126953, 40.66691970825195, 43.504974365234375, 46.34302520751953, 49.18107986450195, 52.019134521484375, 54.8571891784668, 57.69524383544922, 60.533294677734375, 63.3713493347168, 66.20940399169922, 69.04745483398438, 71.88551330566406, 74.72356414794922, 77.56161499023438, 80.39967346191406, 83.23772430419922, 86.07577514648438, 88.91383361816406, 91.75188446044922, 94.58993530273438, 97.42799377441406]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 5.0, 7.0, 8.0, 7.0, 13.0, 15.0, 18.0, 22.0, 23.0, 22.0, 27.0, 27.0, 37.0, 30.0, 31.0, 33.0, 31.0, 34.0, 40.0, 34.0, 48.0, 44.0, 47.0, 39.0, 31.0, 46.0, 38.0, 32.0, 23.0, 25.0, 19.0, 20.0, 20.0, 18.0, 13.0, 13.0, 7.0, 11.0, 12.0, 8.0, 4.0, 3.0, 2.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-11.6953125, -11.310546875, -10.92578125, -10.541015625, -10.15625, -9.771484375, -9.38671875, -9.001953125, -8.6171875, -8.232421875, -7.84765625, -7.462890625, -7.078125, -6.693359375, -6.30859375, -5.923828125, -5.5390625, -5.154296875, -4.76953125, -4.384765625, -4.0, -3.615234375, -3.23046875, -2.845703125, -2.4609375, -2.076171875, -1.69140625, -1.306640625, -0.921875, -0.537109375, -0.15234375, 0.232421875, 0.6171875, 1.001953125, 1.38671875, 1.771484375, 2.15625, 2.541015625, 2.92578125, 3.310546875, 3.6953125, 4.080078125, 4.46484375, 4.849609375, 5.234375, 5.619140625, 6.00390625, 6.388671875, 6.7734375, 7.158203125, 7.54296875, 7.927734375, 8.3125, 8.697265625, 9.08203125, 9.466796875, 9.8515625, 10.236328125, 10.62109375, 11.005859375, 11.390625, 11.775390625, 12.16015625, 12.544921875, 12.9296875]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 8.0, 14.0, 24.0, 26.0, 42.0, 50.0, 81.0, 123.0, 172.0, 232.0, 317.0, 463.0, 723.0, 1092.0, 1612.0, 2520.0, 3823.0, 6411.0, 10861.0, 20646.0, 49804.0, 157302.0, 576315.0, 1623025.0, 1191677.0, 378867.0, 97068.0, 32230.0, 15359.0, 8634.0, 5103.0, 3222.0, 2047.0, 1459.0, 915.0, 545.0, 407.0, 309.0, 211.0, 152.0, 122.0, 79.0, 56.0, 30.0, 26.0, 19.0, 18.0, 13.0, 9.0, 8.0, 6.0, 2.0, 6.0, 0.0, 3.0, 1.0], "bins": [-14.421875, -13.9686279296875, -13.515380859375, -13.0621337890625, -12.60888671875, -12.1556396484375, -11.702392578125, -11.2491455078125, -10.7958984375, -10.3426513671875, -9.889404296875, -9.4361572265625, -8.98291015625, -8.5296630859375, -8.076416015625, -7.6231689453125, -7.169921875, -6.7166748046875, -6.263427734375, -5.8101806640625, -5.35693359375, -4.9036865234375, -4.450439453125, -3.9971923828125, -3.5439453125, -3.0906982421875, -2.637451171875, -2.1842041015625, -1.73095703125, -1.2777099609375, -0.824462890625, -0.3712158203125, 0.08203125, 0.5352783203125, 0.988525390625, 1.4417724609375, 1.89501953125, 2.3482666015625, 2.801513671875, 3.2547607421875, 3.7080078125, 4.1612548828125, 4.614501953125, 5.0677490234375, 5.52099609375, 5.9742431640625, 6.427490234375, 6.8807373046875, 7.333984375, 7.7872314453125, 8.240478515625, 8.6937255859375, 9.14697265625, 9.6002197265625, 10.053466796875, 10.5067138671875, 10.9599609375, 11.4132080078125, 11.866455078125, 12.3197021484375, 12.77294921875, 13.2261962890625, 13.679443359375, 14.1326904296875, 14.5859375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 4.0, 3.0, 5.0, 10.0, 9.0, 13.0, 22.0, 34.0, 35.0, 52.0, 64.0, 81.0, 154.0, 226.0, 411.0, 695.0, 823.0, 589.0, 311.0, 167.0, 104.0, 63.0, 57.0, 34.0, 23.0, 20.0, 20.0, 17.0, 10.0, 11.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-35.96875, -35.07568359375, -34.1826171875, -33.28955078125, -32.396484375, -31.50341796875, -30.6103515625, -29.71728515625, -28.82421875, -27.93115234375, -27.0380859375, -26.14501953125, -25.251953125, -24.35888671875, -23.4658203125, -22.57275390625, -21.6796875, -20.78662109375, -19.8935546875, -19.00048828125, -18.107421875, -17.21435546875, -16.3212890625, -15.42822265625, -14.53515625, -13.64208984375, -12.7490234375, -11.85595703125, -10.962890625, -10.06982421875, -9.1767578125, -8.28369140625, -7.390625, -6.49755859375, -5.6044921875, -4.71142578125, -3.818359375, -2.92529296875, -2.0322265625, -1.13916015625, -0.24609375, 0.64697265625, 1.5400390625, 2.43310546875, 3.326171875, 4.21923828125, 5.1123046875, 6.00537109375, 6.8984375, 7.79150390625, 8.6845703125, 9.57763671875, 10.470703125, 11.36376953125, 12.2568359375, 13.14990234375, 14.04296875, 14.93603515625, 15.8291015625, 16.72216796875, 17.615234375, 18.50830078125, 19.4013671875, 20.29443359375, 21.1875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 5.0, 7.0, 13.0, 19.0, 15.0, 23.0, 32.0, 29.0, 63.0, 97.0, 219.0, 536.0, 3075.0, 75594.0, 4028231.0, 82041.0, 3088.0, 594.0, 230.0, 106.0, 80.0, 48.0, 32.0, 35.0, 17.0, 12.0, 15.0, 4.0, 6.0, 4.0, 3.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.4375, -83.8701171875, -80.302734375, -76.7353515625, -73.16796875, -69.6005859375, -66.033203125, -62.4658203125, -58.8984375, -55.3310546875, -51.763671875, -48.1962890625, -44.62890625, -41.0615234375, -37.494140625, -33.9267578125, -30.359375, -26.7919921875, -23.224609375, -19.6572265625, -16.08984375, -12.5224609375, -8.955078125, -5.3876953125, -1.8203125, 1.7470703125, 5.314453125, 8.8818359375, 12.44921875, 16.0166015625, 19.583984375, 23.1513671875, 26.71875, 30.2861328125, 33.853515625, 37.4208984375, 40.98828125, 44.5556640625, 48.123046875, 51.6904296875, 55.2578125, 58.8251953125, 62.392578125, 65.9599609375, 69.52734375, 73.0947265625, 76.662109375, 80.2294921875, 83.796875, 87.3642578125, 90.931640625, 94.4990234375, 98.06640625, 101.6337890625, 105.201171875, 108.7685546875, 112.3359375, 115.9033203125, 119.470703125, 123.0380859375, 126.60546875, 130.1728515625, 133.740234375, 137.3076171875, 140.875]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 21.0, 43.0, 104.0, 225.0, 298.0, 188.0, 87.0, 32.0, 12.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0], "bins": [-356.9347229003906, -350.2441101074219, -343.5534973144531, -336.8628845214844, -330.1722717285156, -323.48162841796875, -316.791015625, -310.10040283203125, -303.4097900390625, -296.71917724609375, -290.028564453125, -283.33795166015625, -276.6473388671875, -269.95672607421875, -263.2660827636719, -256.5754699707031, -249.88485717773438, -243.19424438476562, -236.50363159179688, -229.81300354003906, -223.1223907470703, -216.43177795410156, -209.7411651611328, -203.050537109375, -196.3599395751953, -189.66932678222656, -182.9787139892578, -176.2880859375, -169.59747314453125, -162.9068603515625, -156.21624755859375, -149.525634765625, -142.8350067138672, -136.14439392089844, -129.4537811279297, -122.7631607055664, -116.07254028320312, -109.38192749023438, -102.69131469726562, -96.00069427490234, -89.31007385253906, -82.61946105957031, -75.92884063720703, -69.23822784423828, -62.547607421875, -55.85699462890625, -49.166378021240234, -42.47576141357422, -35.78514862060547, -29.094532012939453, -22.403915405273438, -15.713300704956055, -9.022684097290039, -2.3320693969726562, 4.358547210693359, 11.049163818359375, 17.73978042602539, 24.430397033691406, 31.121013641357422, 37.81163024902344, 44.50224304199219, 51.1928596496582, 57.88347625732422, 64.5740966796875, 71.26470947265625]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 1.0, 5.0, 11.0, 5.0, 11.0, 8.0, 9.0, 14.0, 8.0, 14.0, 12.0, 14.0, 17.0, 15.0, 24.0, 22.0, 24.0, 30.0, 30.0, 38.0, 25.0, 39.0, 39.0, 46.0, 25.0, 45.0, 43.0, 23.0, 39.0, 31.0, 29.0, 31.0, 34.0, 27.0, 33.0, 14.0, 31.0, 16.0, 11.0, 26.0, 10.0, 12.0, 12.0, 14.0, 7.0, 10.0, 6.0, 6.0, 3.0, 1.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-61.083892822265625, -59.129764556884766, -57.175636291503906, -55.22150802612305, -53.26737976074219, -51.313255310058594, -49.359127044677734, -47.404998779296875, -45.450870513916016, -43.496742248535156, -41.5426139831543, -39.58848571777344, -37.634361267089844, -35.68022918701172, -33.726104736328125, -31.771976470947266, -29.817848205566406, -27.863719940185547, -25.909591674804688, -23.95546531677246, -22.0013370513916, -20.047208786010742, -18.093082427978516, -16.138954162597656, -14.184825897216797, -12.230697631835938, -10.276570320129395, -8.322443008422852, -6.368314743041992, -4.414186477661133, -2.46005916595459, -0.5059318542480469, 1.4481964111328125, 3.4023241996765137, 5.356451988220215, 7.310579776763916, 9.264707565307617, 11.218835830688477, 13.17296314239502, 15.127090454101562, 17.081218719482422, 19.03534698486328, 20.98947525024414, 22.943601608276367, 24.897729873657227, 26.851858139038086, 28.805984497070312, 30.760112762451172, 32.71424102783203, 34.66836929321289, 36.62249755859375, 38.57662582397461, 40.53075408935547, 42.48487854003906, 44.43900680541992, 46.39313507080078, 48.34726333618164, 50.3013916015625, 52.25551986694336, 54.20964813232422, 56.16377258300781, 58.11790466308594, 60.07202911376953, 62.02615737915039, 63.98028564453125]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 1.0, 4.0, 3.0, 8.0, 12.0, 9.0, 17.0, 14.0, 14.0, 22.0, 25.0, 27.0, 20.0, 30.0, 31.0, 34.0, 29.0, 38.0, 39.0, 45.0, 35.0, 22.0, 34.0, 45.0, 42.0, 41.0, 32.0, 44.0, 34.0, 41.0, 26.0, 21.0, 25.0, 19.0, 20.0, 16.0, 22.0, 15.0, 8.0, 6.0, 5.0, 7.0, 2.0, 5.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.171875, -10.8018798828125, -10.431884765625, -10.0618896484375, -9.69189453125, -9.3218994140625, -8.951904296875, -8.5819091796875, -8.2119140625, -7.8419189453125, -7.471923828125, -7.1019287109375, -6.73193359375, -6.3619384765625, -5.991943359375, -5.6219482421875, -5.251953125, -4.8819580078125, -4.511962890625, -4.1419677734375, -3.77197265625, -3.4019775390625, -3.031982421875, -2.6619873046875, -2.2919921875, -1.9219970703125, -1.552001953125, -1.1820068359375, -0.81201171875, -0.4420166015625, -0.072021484375, 0.2979736328125, 0.66796875, 1.0379638671875, 1.407958984375, 1.7779541015625, 2.14794921875, 2.5179443359375, 2.887939453125, 3.2579345703125, 3.6279296875, 3.9979248046875, 4.367919921875, 4.7379150390625, 5.10791015625, 5.4779052734375, 5.847900390625, 6.2178955078125, 6.587890625, 6.9578857421875, 7.327880859375, 7.6978759765625, 8.06787109375, 8.4378662109375, 8.807861328125, 9.1778564453125, 9.5478515625, 9.9178466796875, 10.287841796875, 10.6578369140625, 11.02783203125, 11.3978271484375, 11.767822265625, 12.1378173828125, 12.5078125]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 9.0, 12.0, 20.0, 34.0, 33.0, 58.0, 89.0, 116.0, 192.0, 279.0, 402.0, 584.0, 900.0, 1293.0, 1802.0, 2693.0, 4068.0, 6039.0, 9374.0, 14132.0, 21761.0, 34075.0, 52989.0, 82495.0, 129726.0, 193510.0, 175237.0, 113171.0, 71329.0, 46019.0, 29680.0, 19181.0, 12604.0, 8176.0, 5424.0, 3586.0, 2434.0, 1577.0, 1099.0, 730.0, 488.0, 339.0, 252.0, 172.0, 122.0, 60.0, 56.0, 47.0, 31.0, 24.0, 12.0, 5.0, 9.0, 5.0, 5.0, 1.0, 1.0, 2.0], "bins": [-0.251953125, -0.24404144287109375, -0.2361297607421875, -0.22821807861328125, -0.220306396484375, -0.21239471435546875, -0.2044830322265625, -0.19657135009765625, -0.18865966796875, -0.18074798583984375, -0.1728363037109375, -0.16492462158203125, -0.157012939453125, -0.14910125732421875, -0.1411895751953125, -0.13327789306640625, -0.1253662109375, -0.11745452880859375, -0.1095428466796875, -0.10163116455078125, -0.093719482421875, -0.08580780029296875, -0.0778961181640625, -0.06998443603515625, -0.06207275390625, -0.05416107177734375, -0.0462493896484375, -0.03833770751953125, -0.030426025390625, -0.02251434326171875, -0.0146026611328125, -0.00669097900390625, 0.001220703125, 0.00913238525390625, 0.0170440673828125, 0.02495574951171875, 0.032867431640625, 0.04077911376953125, 0.0486907958984375, 0.05660247802734375, 0.06451416015625, 0.07242584228515625, 0.0803375244140625, 0.08824920654296875, 0.096160888671875, 0.10407257080078125, 0.1119842529296875, 0.11989593505859375, 0.1278076171875, 0.13571929931640625, 0.1436309814453125, 0.15154266357421875, 0.159454345703125, 0.16736602783203125, 0.1752777099609375, 0.18318939208984375, 0.19110107421875, 0.19901275634765625, 0.2069244384765625, 0.21483612060546875, 0.222747802734375, 0.23065948486328125, 0.2385711669921875, 0.24648284912109375, 0.25439453125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 4.0, 2.0, 3.0, 7.0, 6.0, 16.0, 10.0, 12.0, 18.0, 15.0, 14.0, 19.0, 27.0, 28.0, 28.0, 36.0, 36.0, 42.0, 28.0, 35.0, 26.0, 33.0, 34.0, 1055.0, 34.0, 32.0, 36.0, 30.0, 36.0, 30.0, 32.0, 28.0, 33.0, 24.0, 25.0, 27.0, 20.0, 29.0, 12.0, 11.0, 11.0, 13.0, 6.0, 3.0, 8.0, 3.0, 2.0, 3.0, 0.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.9921875, -7.7354736328125, -7.478759765625, -7.2220458984375, -6.96533203125, -6.7086181640625, -6.451904296875, -6.1951904296875, -5.9384765625, -5.6817626953125, -5.425048828125, -5.1683349609375, -4.91162109375, -4.6549072265625, -4.398193359375, -4.1414794921875, -3.884765625, -3.6280517578125, -3.371337890625, -3.1146240234375, -2.85791015625, -2.6011962890625, -2.344482421875, -2.0877685546875, -1.8310546875, -1.5743408203125, -1.317626953125, -1.0609130859375, -0.80419921875, -0.5474853515625, -0.290771484375, -0.0340576171875, 0.22265625, 0.4793701171875, 0.736083984375, 0.9927978515625, 1.24951171875, 1.5062255859375, 1.762939453125, 2.0196533203125, 2.2763671875, 2.5330810546875, 2.789794921875, 3.0465087890625, 3.30322265625, 3.5599365234375, 3.816650390625, 4.0733642578125, 4.330078125, 4.5867919921875, 4.843505859375, 5.1002197265625, 5.35693359375, 5.6136474609375, 5.870361328125, 6.1270751953125, 6.3837890625, 6.6405029296875, 6.897216796875, 7.1539306640625, 7.41064453125, 7.6673583984375, 7.924072265625, 8.1807861328125, 8.4375]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 5.0, 3.0, 12.0, 12.0, 6.0, 29.0, 34.0, 55.0, 80.0, 92.0, 156.0, 206.0, 291.0, 398.0, 560.0, 764.0, 1138.0, 1611.0, 2183.0, 3201.0, 4589.0, 6509.0, 9522.0, 13725.0, 20087.0, 29447.0, 43131.0, 63589.0, 95331.0, 146462.0, 1235461.0, 138184.0, 90271.0, 60205.0, 40844.0, 27498.0, 18589.0, 12976.0, 8881.0, 6344.0, 4426.0, 2934.0, 2012.0, 1527.0, 1145.0, 754.0, 563.0, 392.0, 275.0, 184.0, 128.0, 101.0, 74.0, 57.0, 30.0, 24.0, 18.0, 11.0, 3.0, 3.0, 3.0, 1.0, 4.0], "bins": [-0.11627197265625, -0.11257266998291016, -0.10887336730957031, -0.10517406463623047, -0.10147476196289062, -0.09777545928955078, -0.09407615661621094, -0.0903768539428711, -0.08667755126953125, -0.0829782485961914, -0.07927894592285156, -0.07557964324951172, -0.07188034057617188, -0.06818103790283203, -0.06448173522949219, -0.060782432556152344, -0.0570831298828125, -0.053383827209472656, -0.04968452453613281, -0.04598522186279297, -0.042285919189453125, -0.03858661651611328, -0.03488731384277344, -0.031188011169433594, -0.02748870849609375, -0.023789405822753906, -0.020090103149414062, -0.01639080047607422, -0.012691497802734375, -0.008992195129394531, -0.0052928924560546875, -0.0015935897827148438, 0.002105712890625, 0.005805015563964844, 0.009504318237304688, 0.013203620910644531, 0.016902923583984375, 0.02060222625732422, 0.024301528930664062, 0.028000831604003906, 0.03170013427734375, 0.035399436950683594, 0.03909873962402344, 0.04279804229736328, 0.046497344970703125, 0.05019664764404297, 0.05389595031738281, 0.057595252990722656, 0.0612945556640625, 0.06499385833740234, 0.06869316101074219, 0.07239246368408203, 0.07609176635742188, 0.07979106903076172, 0.08349037170410156, 0.0871896743774414, 0.09088897705078125, 0.0945882797241211, 0.09828758239746094, 0.10198688507080078, 0.10568618774414062, 0.10938549041748047, 0.11308479309082031, 0.11678409576416016, 0.1204833984375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 4.0, 2.0, 1.0, 9.0, 7.0, 10.0, 11.0, 14.0, 13.0, 17.0, 23.0, 33.0, 42.0, 36.0, 66.0, 42.0, 61.0, 47.0, 85.0, 61.0, 56.0, 56.0, 42.0, 48.0, 37.0, 36.0, 27.0, 21.0, 16.0, 14.0, 11.0, 5.0, 9.0, 6.0, 5.0, 8.0, 4.0, 3.0, 1.0, 3.0, 3.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0006504058837890625, -0.0006269589066505432, -0.0006035119295120239, -0.0005800649523735046, -0.0005566179752349854, -0.0005331709980964661, -0.0005097240209579468, -0.0004862770438194275, -0.0004628300666809082, -0.0004393830895423889, -0.00041593611240386963, -0.00039248913526535034, -0.00036904215812683105, -0.00034559518098831177, -0.0003221482038497925, -0.0002987012267112732, -0.0002752542495727539, -0.0002518072724342346, -0.00022836029529571533, -0.00020491331815719604, -0.00018146634101867676, -0.00015801936388015747, -0.00013457238674163818, -0.0001111254096031189, -8.767843246459961e-05, -6.423145532608032e-05, -4.0784478187561035e-05, -1.7337501049041748e-05, 6.109476089477539e-06, 2.9556453227996826e-05, 5.300343036651611e-05, 7.64504075050354e-05, 9.989738464355469e-05, 0.00012334436178207397, 0.00014679133892059326, 0.00017023831605911255, 0.00019368529319763184, 0.00021713227033615112, 0.0002405792474746704, 0.0002640262246131897, 0.000287473201751709, 0.00031092017889022827, 0.00033436715602874756, 0.00035781413316726685, 0.00038126111030578613, 0.0004047080874443054, 0.0004281550645828247, 0.000451602041721344, 0.0004750490188598633, 0.0004984959959983826, 0.0005219429731369019, 0.0005453899502754211, 0.0005688369274139404, 0.0005922839045524597, 0.000615730881690979, 0.0006391778588294983, 0.0006626248359680176, 0.0006860718131065369, 0.0007095187902450562, 0.0007329657673835754, 0.0007564127445220947, 0.000779859721660614, 0.0008033066987991333, 0.0008267536759376526, 0.0008502006530761719]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 2.0, 2.0, 3.0, 4.0, 3.0, 7.0, 5.0, 7.0, 7.0, 7.0, 8.0, 17.0, 17.0, 22.0, 31.0, 49.0, 40.0, 91.0, 91.0, 217.0, 580.0, 17410.0, 1026642.0, 2394.0, 377.0, 144.0, 115.0, 46.0, 56.0, 39.0, 26.0, 16.0, 16.0, 11.0, 13.0, 11.0, 6.0, 7.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.02056884765625, -0.020002365112304688, -0.019435882568359375, -0.018869400024414062, -0.01830291748046875, -0.017736434936523438, -0.017169952392578125, -0.016603469848632812, -0.0160369873046875, -0.015470504760742188, -0.014904022216796875, -0.014337539672851562, -0.01377105712890625, -0.013204574584960938, -0.012638092041015625, -0.012071609497070312, -0.011505126953125, -0.010938644409179688, -0.010372161865234375, -0.009805679321289062, -0.00923919677734375, -0.008672714233398438, -0.008106231689453125, -0.0075397491455078125, -0.0069732666015625, -0.0064067840576171875, -0.005840301513671875, -0.0052738189697265625, -0.00470733642578125, -0.0041408538818359375, -0.003574371337890625, -0.0030078887939453125, -0.00244140625, -0.0018749237060546875, -0.001308441162109375, -0.0007419586181640625, -0.00017547607421875, 0.0003910064697265625, 0.000957489013671875, 0.0015239715576171875, 0.0020904541015625, 0.0026569366455078125, 0.003223419189453125, 0.0037899017333984375, 0.00435638427734375, 0.0049228668212890625, 0.005489349365234375, 0.0060558319091796875, 0.006622314453125, 0.0071887969970703125, 0.007755279541015625, 0.008321762084960938, 0.00888824462890625, 0.009454727172851562, 0.010021209716796875, 0.010587692260742188, 0.0111541748046875, 0.011720657348632812, 0.012287139892578125, 0.012853622436523438, 0.01342010498046875, 0.013986587524414062, 0.014553070068359375, 0.015119552612304688, 0.01568603515625]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 21.0, 964.0, 27.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.013575304299592972, -0.013312075287103653, -0.013048846274614334, -0.01278561633080244, -0.012522387318313122, -0.012259158305823803, -0.011995929293334484, -0.01173269934952259, -0.011469470337033272, -0.011206241324543953, -0.010943012312054634, -0.01067978236824274, -0.010416553355753422, -0.010153324343264103, -0.009890095330774784, -0.00962686538696289, -0.009363636374473572, -0.009100407361984253, -0.008837178349494934, -0.00857394840568304, -0.008310719393193722, -0.008047490380704403, -0.007784261368215084, -0.007521031890064478, -0.007257803343236446, -0.0069945743307471275, -0.006731344852596521, -0.0064681158401072025, -0.006204886361956596, -0.0059416573494672775, -0.005678428336977959, -0.0054151988588273525, -0.005151968449354172, -0.004888739436864853, -0.004625509958714247, -0.004362280946224928, -0.004099051468074322, -0.003835822455585003, -0.0035725932102650404, -0.003309363964945078, -0.003046134952455759, -0.0027829057071357965, -0.002519676461815834, -0.002256447449326515, -0.001993217971175909, -0.0017299888422712684, -0.0014667597133666277, -0.0012035304680466652, -0.0009403012227267027, -0.0006770719774067402, -0.0004138427902944386, -0.000150613603182137, 0.00011261564213782549, 0.000375844887457788, 0.0006390740163624287, 0.0009023032616823912, 0.0011655325070023537, 0.0014287617523223162, 0.0016919909976422787, 0.0019552200101315975, 0.0022184494882822037, 0.0024816785007715225, 0.002744907746091485, 0.0030081369914114475, 0.00327136623673141]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 11.0, 11.0, 23.0, 25.0, 31.0, 31.0, 56.0, 52.0, 70.0, 73.0, 93.0, 68.0, 83.0, 67.0, 61.0, 46.0, 53.0, 45.0, 33.0, 26.0, 21.0, 5.0, 7.0, 8.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000981152057647705, -0.0009465292096138, -0.000911906361579895, -0.00087728351354599, -0.000842660665512085, -0.0008080378174781799, -0.0007734149694442749, -0.0007387921214103699, -0.0007041692733764648, -0.0006695464253425598, -0.0006349235773086548, -0.0006003007292747498, -0.0005656778812408447, -0.0005310550332069397, -0.0004964321851730347, -0.00046180933713912964, -0.0004271864891052246, -0.0003925636410713196, -0.00035794079303741455, -0.0003233179450035095, -0.0002886950969696045, -0.00025407224893569946, -0.00021944940090179443, -0.0001848265528678894, -0.00015020370483398438, -0.00011558085680007935, -8.095800876617432e-05, -4.633516073226929e-05, -1.1712312698364258e-05, 2.291053533554077e-05, 5.75333833694458e-05, 9.215623140335083e-05, 0.00012677907943725586, 0.0001614019274711609, 0.00019602477550506592, 0.00023064762353897095, 0.000265270471572876, 0.000299893319606781, 0.00033451616764068604, 0.00036913901567459106, 0.0004037618637084961, 0.0004383847117424011, 0.00047300755977630615, 0.0005076304078102112, 0.0005422532558441162, 0.0005768761038780212, 0.0006114989519119263, 0.0006461217999458313, 0.0006807446479797363, 0.0007153674960136414, 0.0007499903440475464, 0.0007846131920814514, 0.0008192360401153564, 0.0008538588881492615, 0.0008884817361831665, 0.0009231045842170715, 0.0009577274322509766, 0.0009923502802848816, 0.0010269731283187866, 0.0010615959763526917, 0.0010962188243865967, 0.0011308416724205017, 0.0011654645204544067, 0.0012000873684883118, 0.0012347102165222168]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 1.0, 4.0, 3.0, 8.0, 12.0, 9.0, 17.0, 14.0, 14.0, 22.0, 25.0, 27.0, 20.0, 30.0, 31.0, 34.0, 29.0, 38.0, 39.0, 45.0, 35.0, 22.0, 34.0, 45.0, 42.0, 41.0, 32.0, 44.0, 34.0, 41.0, 26.0, 21.0, 25.0, 19.0, 20.0, 16.0, 22.0, 15.0, 8.0, 6.0, 5.0, 7.0, 2.0, 5.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.171875, -10.8018798828125, -10.431884765625, -10.0618896484375, -9.69189453125, -9.3218994140625, -8.951904296875, -8.5819091796875, -8.2119140625, -7.8419189453125, -7.471923828125, -7.1019287109375, -6.73193359375, -6.3619384765625, -5.991943359375, -5.6219482421875, -5.251953125, -4.8819580078125, -4.511962890625, -4.1419677734375, -3.77197265625, -3.4019775390625, -3.031982421875, -2.6619873046875, -2.2919921875, -1.9219970703125, -1.552001953125, -1.1820068359375, -0.81201171875, -0.4420166015625, -0.072021484375, 0.2979736328125, 0.66796875, 1.0379638671875, 1.407958984375, 1.7779541015625, 2.14794921875, 2.5179443359375, 2.887939453125, 3.2579345703125, 3.6279296875, 3.9979248046875, 4.367919921875, 4.7379150390625, 5.10791015625, 5.4779052734375, 5.847900390625, 6.2178955078125, 6.587890625, 6.9578857421875, 7.327880859375, 7.6978759765625, 8.06787109375, 8.4378662109375, 8.807861328125, 9.1778564453125, 9.5478515625, 9.9178466796875, 10.287841796875, 10.6578369140625, 11.02783203125, 11.3978271484375, 11.767822265625, 12.1378173828125, 12.5078125]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 5.0, 6.0, 5.0, 10.0, 13.0, 23.0, 27.0, 47.0, 64.0, 76.0, 114.0, 143.0, 217.0, 275.0, 389.0, 542.0, 839.0, 1216.0, 1710.0, 2669.0, 3970.0, 6194.0, 10212.0, 17637.0, 35771.0, 123558.0, 606771.0, 147948.0, 39043.0, 18968.0, 10721.0, 6557.0, 4097.0, 2784.0, 1787.0, 1241.0, 859.0, 604.0, 425.0, 294.0, 195.0, 144.0, 107.0, 85.0, 55.0, 40.0, 35.0, 22.0, 15.0, 10.0, 8.0, 5.0, 4.0, 3.0, 4.0, 1.0, 2.0], "bins": [-18.609375, -18.0546875, -17.5, -16.9453125, -16.390625, -15.8359375, -15.28125, -14.7265625, -14.171875, -13.6171875, -13.0625, -12.5078125, -11.953125, -11.3984375, -10.84375, -10.2890625, -9.734375, -9.1796875, -8.625, -8.0703125, -7.515625, -6.9609375, -6.40625, -5.8515625, -5.296875, -4.7421875, -4.1875, -3.6328125, -3.078125, -2.5234375, -1.96875, -1.4140625, -0.859375, -0.3046875, 0.25, 0.8046875, 1.359375, 1.9140625, 2.46875, 3.0234375, 3.578125, 4.1328125, 4.6875, 5.2421875, 5.796875, 6.3515625, 6.90625, 7.4609375, 8.015625, 8.5703125, 9.125, 9.6796875, 10.234375, 10.7890625, 11.34375, 11.8984375, 12.453125, 13.0078125, 13.5625, 14.1171875, 14.671875, 15.2265625, 15.78125, 16.3359375, 16.890625]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 6.0, 7.0, 12.0, 19.0, 13.0, 16.0, 19.0, 14.0, 20.0, 32.0, 30.0, 38.0, 33.0, 38.0, 46.0, 49.0, 68.0, 101.0, 422.0, 1452.0, 113.0, 73.0, 61.0, 41.0, 48.0, 30.0, 39.0, 35.0, 31.0, 17.0, 32.0, 13.0, 16.0, 14.0, 14.0, 5.0, 9.0, 4.0, 8.0, 0.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.5625, -38.36376953125, -37.1650390625, -35.96630859375, -34.767578125, -33.56884765625, -32.3701171875, -31.17138671875, -29.97265625, -28.77392578125, -27.5751953125, -26.37646484375, -25.177734375, -23.97900390625, -22.7802734375, -21.58154296875, -20.3828125, -19.18408203125, -17.9853515625, -16.78662109375, -15.587890625, -14.38916015625, -13.1904296875, -11.99169921875, -10.79296875, -9.59423828125, -8.3955078125, -7.19677734375, -5.998046875, -4.79931640625, -3.6005859375, -2.40185546875, -1.203125, -0.00439453125, 1.1943359375, 2.39306640625, 3.591796875, 4.79052734375, 5.9892578125, 7.18798828125, 8.38671875, 9.58544921875, 10.7841796875, 11.98291015625, 13.181640625, 14.38037109375, 15.5791015625, 16.77783203125, 17.9765625, 19.17529296875, 20.3740234375, 21.57275390625, 22.771484375, 23.97021484375, 25.1689453125, 26.36767578125, 27.56640625, 28.76513671875, 29.9638671875, 31.16259765625, 32.361328125, 33.56005859375, 34.7587890625, 35.95751953125, 37.15625]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 9.0, 8.0, 10.0, 7.0, 21.0, 25.0, 24.0, 35.0, 56.0, 49.0, 78.0, 117.0, 189.0, 316.0, 627.0, 1569.0, 4319.0, 14289.0, 63878.0, 2662290.0, 349577.0, 34120.0, 8918.0, 2792.0, 1076.0, 481.0, 247.0, 159.0, 112.0, 80.0, 44.0, 39.0, 31.0, 28.0, 19.0, 17.0, 12.0, 11.0, 5.0, 7.0, 4.0, 5.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-49.34375, -47.7421875, -46.140625, -44.5390625, -42.9375, -41.3359375, -39.734375, -38.1328125, -36.53125, -34.9296875, -33.328125, -31.7265625, -30.125, -28.5234375, -26.921875, -25.3203125, -23.71875, -22.1171875, -20.515625, -18.9140625, -17.3125, -15.7109375, -14.109375, -12.5078125, -10.90625, -9.3046875, -7.703125, -6.1015625, -4.5, -2.8984375, -1.296875, 0.3046875, 1.90625, 3.5078125, 5.109375, 6.7109375, 8.3125, 9.9140625, 11.515625, 13.1171875, 14.71875, 16.3203125, 17.921875, 19.5234375, 21.125, 22.7265625, 24.328125, 25.9296875, 27.53125, 29.1328125, 30.734375, 32.3359375, 33.9375, 35.5390625, 37.140625, 38.7421875, 40.34375, 41.9453125, 43.546875, 45.1484375, 46.75, 48.3515625, 49.953125, 51.5546875, 53.15625]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 12.0, 29.0, 97.0, 230.0, 314.0, 219.0, 76.0, 22.0, 10.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.84812545776367, -47.24433898925781, -41.64055252075195, -36.036766052246094, -30.432979583740234, -24.829193115234375, -19.225406646728516, -13.621620178222656, -8.017833709716797, -2.4140472412109375, 3.189739227294922, 8.793525695800781, 14.39731216430664, 20.0010986328125, 25.60488510131836, 31.20867156982422, 36.81245803833008, 42.41624450683594, 48.0200309753418, 53.623817443847656, 59.227603912353516, 64.83139038085938, 70.4351806640625, 76.0389633178711, 81.64274597167969, 87.24653625488281, 92.8503189086914, 98.4541015625, 104.05789184570312, 109.66168212890625, 115.26546478271484, 120.86924743652344, 126.47305297851562, 132.07684326171875, 137.68063354492188, 143.28440856933594, 148.88819885253906, 154.4919891357422, 160.09576416015625, 165.69955444335938, 171.3033447265625, 176.90713500976562, 182.51092529296875, 188.1147003173828, 193.71849060058594, 199.32228088378906, 204.92605590820312, 210.52984619140625, 216.13363647460938, 221.7374267578125, 227.34121704101562, 232.9449920654297, 238.5487823486328, 244.15257263183594, 249.75634765625, 255.36013793945312, 260.96392822265625, 266.5677185058594, 272.1715087890625, 277.7752990722656, 283.37908935546875, 288.98284912109375, 294.5866394042969, 300.1904296875, 305.7942199707031]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 8.0, 9.0, 2.0, 7.0, 11.0, 8.0, 14.0, 10.0, 18.0, 17.0, 19.0, 15.0, 25.0, 36.0, 33.0, 31.0, 35.0, 32.0, 46.0, 34.0, 43.0, 45.0, 47.0, 37.0, 34.0, 30.0, 38.0, 28.0, 36.0, 26.0, 32.0, 30.0, 19.0, 23.0, 20.0, 18.0, 17.0, 10.0, 9.0, 11.0, 10.0, 9.0, 4.0, 7.0, 2.0, 6.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0], "bins": [-104.2725830078125, -101.24817657470703, -98.22377014160156, -95.1993637084961, -92.17495727539062, -89.15054321289062, -86.12614440917969, -83.10173034667969, -80.07732391357422, -77.05291748046875, -74.02851104736328, -71.00410461425781, -67.97969818115234, -64.95529174804688, -61.93088150024414, -58.906471252441406, -55.8820686340332, -52.857662200927734, -49.833255767822266, -46.80884552001953, -43.78443908691406, -40.760032653808594, -37.735626220703125, -34.711219787597656, -31.686811447143555, -28.662405014038086, -25.637996673583984, -22.613590240478516, -19.589183807373047, -16.564775466918945, -13.540369033813477, -10.515960693359375, -7.491554260253906, -4.467146873474121, -1.4427399635314941, 1.5816669464111328, 4.606074333190918, 7.630481719970703, 10.654888153076172, 13.679296493530273, 16.703702926635742, 19.72810935974121, 22.752517700195312, 25.77692413330078, 28.80133056640625, 31.82573890686035, 34.85014343261719, 37.87455368041992, 40.89896011352539, 43.92336654663086, 46.94777297973633, 49.97218322753906, 52.99658966064453, 56.02099609375, 59.04540252685547, 62.06980895996094, 65.0942153930664, 68.11862182617188, 71.14302825927734, 74.16743469238281, 77.19184112548828, 80.21624755859375, 83.24066162109375, 86.26506805419922, 89.28947448730469]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 6.0, 3.0, 11.0, 11.0, 15.0, 19.0, 19.0, 11.0, 27.0, 26.0, 39.0, 23.0, 18.0, 26.0, 32.0, 43.0, 40.0, 49.0, 33.0, 41.0, 49.0, 41.0, 47.0, 35.0, 50.0, 37.0, 30.0, 27.0, 37.0, 17.0, 24.0, 22.0, 13.0, 11.0, 14.0, 12.0, 12.0, 6.0, 4.0, 4.0, 4.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.8125, -13.4041748046875, -12.995849609375, -12.5875244140625, -12.17919921875, -11.7708740234375, -11.362548828125, -10.9542236328125, -10.5458984375, -10.1375732421875, -9.729248046875, -9.3209228515625, -8.91259765625, -8.5042724609375, -8.095947265625, -7.6876220703125, -7.279296875, -6.8709716796875, -6.462646484375, -6.0543212890625, -5.64599609375, -5.2376708984375, -4.829345703125, -4.4210205078125, -4.0126953125, -3.6043701171875, -3.196044921875, -2.7877197265625, -2.37939453125, -1.9710693359375, -1.562744140625, -1.1544189453125, -0.74609375, -0.3377685546875, 0.070556640625, 0.4788818359375, 0.88720703125, 1.2955322265625, 1.703857421875, 2.1121826171875, 2.5205078125, 2.9288330078125, 3.337158203125, 3.7454833984375, 4.15380859375, 4.5621337890625, 4.970458984375, 5.3787841796875, 5.787109375, 6.1954345703125, 6.603759765625, 7.0120849609375, 7.42041015625, 7.8287353515625, 8.237060546875, 8.6453857421875, 9.0537109375, 9.4620361328125, 9.870361328125, 10.2786865234375, 10.68701171875, 11.0953369140625, 11.503662109375, 11.9119873046875, 12.3203125]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 0.0, 4.0, 7.0, 7.0, 9.0, 7.0, 9.0, 21.0, 22.0, 34.0, 34.0, 64.0, 100.0, 182.0, 286.0, 469.0, 953.0, 1783.0, 3376.0, 7161.0, 16217.0, 45591.0, 302019.0, 2766672.0, 920398.0, 85894.0, 23397.0, 9929.0, 4473.0, 2359.0, 1183.0, 636.0, 369.0, 220.0, 134.0, 76.0, 38.0, 47.0, 17.0, 21.0, 8.0, 13.0, 9.0, 4.0, 5.0, 9.0, 6.0, 3.0, 2.0, 2.0, 7.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-27.546875, -26.64990234375, -25.7529296875, -24.85595703125, -23.958984375, -23.06201171875, -22.1650390625, -21.26806640625, -20.37109375, -19.47412109375, -18.5771484375, -17.68017578125, -16.783203125, -15.88623046875, -14.9892578125, -14.09228515625, -13.1953125, -12.29833984375, -11.4013671875, -10.50439453125, -9.607421875, -8.71044921875, -7.8134765625, -6.91650390625, -6.01953125, -5.12255859375, -4.2255859375, -3.32861328125, -2.431640625, -1.53466796875, -0.6376953125, 0.25927734375, 1.15625, 2.05322265625, 2.9501953125, 3.84716796875, 4.744140625, 5.64111328125, 6.5380859375, 7.43505859375, 8.33203125, 9.22900390625, 10.1259765625, 11.02294921875, 11.919921875, 12.81689453125, 13.7138671875, 14.61083984375, 15.5078125, 16.40478515625, 17.3017578125, 18.19873046875, 19.095703125, 19.99267578125, 20.8896484375, 21.78662109375, 22.68359375, 23.58056640625, 24.4775390625, 25.37451171875, 26.271484375, 27.16845703125, 28.0654296875, 28.96240234375, 29.859375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 7.0, 2.0, 8.0, 13.0, 13.0, 11.0, 15.0, 27.0, 36.0, 39.0, 59.0, 73.0, 108.0, 162.0, 317.0, 589.0, 842.0, 693.0, 383.0, 228.0, 129.0, 88.0, 61.0, 35.0, 25.0, 29.0, 21.0, 13.0, 12.0, 7.0, 13.0, 6.0, 6.0, 2.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.453125, -23.60205078125, -22.7509765625, -21.89990234375, -21.048828125, -20.19775390625, -19.3466796875, -18.49560546875, -17.64453125, -16.79345703125, -15.9423828125, -15.09130859375, -14.240234375, -13.38916015625, -12.5380859375, -11.68701171875, -10.8359375, -9.98486328125, -9.1337890625, -8.28271484375, -7.431640625, -6.58056640625, -5.7294921875, -4.87841796875, -4.02734375, -3.17626953125, -2.3251953125, -1.47412109375, -0.623046875, 0.22802734375, 1.0791015625, 1.93017578125, 2.78125, 3.63232421875, 4.4833984375, 5.33447265625, 6.185546875, 7.03662109375, 7.8876953125, 8.73876953125, 9.58984375, 10.44091796875, 11.2919921875, 12.14306640625, 12.994140625, 13.84521484375, 14.6962890625, 15.54736328125, 16.3984375, 17.24951171875, 18.1005859375, 18.95166015625, 19.802734375, 20.65380859375, 21.5048828125, 22.35595703125, 23.20703125, 24.05810546875, 24.9091796875, 25.76025390625, 26.611328125, 27.46240234375, 28.3134765625, 29.16455078125, 30.015625]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 11.0, 11.0, 16.0, 16.0, 24.0, 33.0, 35.0, 96.0, 138.0, 298.0, 955.0, 4823.0, 52995.0, 3789833.0, 327813.0, 14128.0, 2025.0, 508.0, 175.0, 125.0, 74.0, 35.0, 34.0, 15.0, 18.0, 9.0, 10.0, 12.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-119.25, -116.0048828125, -112.759765625, -109.5146484375, -106.26953125, -103.0244140625, -99.779296875, -96.5341796875, -93.2890625, -90.0439453125, -86.798828125, -83.5537109375, -80.30859375, -77.0634765625, -73.818359375, -70.5732421875, -67.328125, -64.0830078125, -60.837890625, -57.5927734375, -54.34765625, -51.1025390625, -47.857421875, -44.6123046875, -41.3671875, -38.1220703125, -34.876953125, -31.6318359375, -28.38671875, -25.1416015625, -21.896484375, -18.6513671875, -15.40625, -12.1611328125, -8.916015625, -5.6708984375, -2.42578125, 0.8193359375, 4.064453125, 7.3095703125, 10.5546875, 13.7998046875, 17.044921875, 20.2900390625, 23.53515625, 26.7802734375, 30.025390625, 33.2705078125, 36.515625, 39.7607421875, 43.005859375, 46.2509765625, 49.49609375, 52.7412109375, 55.986328125, 59.2314453125, 62.4765625, 65.7216796875, 68.966796875, 72.2119140625, 75.45703125, 78.7021484375, 81.947265625, 85.1923828125, 88.4375]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 7.0, 26.0, 61.0, 182.0, 300.0, 241.0, 135.0, 38.0, 18.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-394.0019226074219, -386.23809814453125, -378.4742431640625, -370.7104187011719, -362.94659423828125, -355.1827392578125, -347.4189147949219, -339.65509033203125, -331.8912353515625, -324.1274108886719, -316.3635559082031, -308.5997314453125, -300.8359069824219, -293.0720520019531, -285.3082275390625, -277.5444030761719, -269.78057861328125, -262.0167541503906, -254.25291442871094, -246.48907470703125, -238.72523498535156, -230.96139526367188, -223.19757080078125, -215.43373107910156, -207.66989135742188, -199.9060516357422, -192.14222717285156, -184.37838745117188, -176.6145477294922, -168.8507080078125, -161.08688354492188, -153.3230438232422, -145.5592041015625, -137.7953643798828, -130.0315399169922, -122.2677001953125, -114.50386047363281, -106.74002838134766, -98.9761962890625, -91.21235656738281, -83.44851684570312, -75.68468475341797, -67.92084503173828, -60.157012939453125, -52.3931770324707, -44.62934112548828, -36.865509033203125, -29.101673126220703, -21.33783721923828, -13.574002265930176, -5.81016731262207, 1.9536666870117188, 9.71750259399414, 17.481338500976562, 25.24517059326172, 33.00900650024414, 40.77284240722656, 48.536678314208984, 56.300514221191406, 64.06434631347656, 71.82818603515625, 79.5920181274414, 87.35585021972656, 95.11968994140625, 102.8835220336914]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 5.0, 2.0, 7.0, 6.0, 17.0, 6.0, 10.0, 16.0, 20.0, 15.0, 16.0, 22.0, 24.0, 16.0, 24.0, 25.0, 29.0, 26.0, 38.0, 34.0, 29.0, 39.0, 41.0, 54.0, 37.0, 36.0, 31.0, 43.0, 26.0, 31.0, 39.0, 23.0, 31.0, 19.0, 23.0, 25.0, 16.0, 11.0, 18.0, 16.0, 13.0, 13.0, 5.0, 4.0, 2.0, 6.0, 8.0, 4.0, 2.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-63.54621124267578, -61.51509475708008, -59.48397445678711, -57.452857971191406, -55.42173767089844, -53.390621185302734, -51.35950469970703, -49.32838439941406, -47.29726791381836, -45.266151428222656, -43.23503112792969, -41.203914642333984, -39.17279815673828, -37.14167785644531, -35.11056137084961, -33.079444885253906, -31.048324584960938, -29.0172061920166, -26.986087799072266, -24.954971313476562, -22.923852920532227, -20.89273452758789, -18.861618041992188, -16.83049964904785, -14.799381256103516, -12.76826286315918, -10.73714542388916, -8.70602798461914, -6.674909591674805, -4.643791198730469, -2.612673759460449, -0.5815563201904297, 1.4495697021484375, 3.4806876182556152, 5.511805534362793, 7.542923450469971, 9.574041366577148, 11.605159759521484, 13.636277198791504, 15.667394638061523, 17.69851303100586, 19.729631423950195, 21.76074981689453, 23.791866302490234, 25.82298469543457, 27.854103088378906, 29.88521957397461, 31.916337966918945, 33.94745635986328, 35.978572845458984, 38.00969314575195, 40.040809631347656, 42.071929931640625, 44.10304641723633, 46.13416290283203, 48.165283203125, 50.1963996887207, 52.227516174316406, 54.258636474609375, 56.28975296020508, 58.32086944580078, 60.35198974609375, 62.38310623168945, 64.41422271728516, 66.44534301757812]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 4.0, 5.0, 4.0, 8.0, 10.0, 16.0, 21.0, 17.0, 27.0, 27.0, 26.0, 36.0, 36.0, 35.0, 32.0, 36.0, 49.0, 41.0, 36.0, 48.0, 47.0, 40.0, 35.0, 40.0, 48.0, 39.0, 27.0, 30.0, 41.0, 26.0, 25.0, 11.0, 17.0, 13.0, 11.0, 6.0, 4.0, 6.0, 8.0, 4.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0], "bins": [-15.6875, -15.247314453125, -14.80712890625, -14.366943359375, -13.9267578125, -13.486572265625, -13.04638671875, -12.606201171875, -12.166015625, -11.725830078125, -11.28564453125, -10.845458984375, -10.4052734375, -9.965087890625, -9.52490234375, -9.084716796875, -8.64453125, -8.204345703125, -7.76416015625, -7.323974609375, -6.8837890625, -6.443603515625, -6.00341796875, -5.563232421875, -5.123046875, -4.682861328125, -4.24267578125, -3.802490234375, -3.3623046875, -2.922119140625, -2.48193359375, -2.041748046875, -1.6015625, -1.161376953125, -0.72119140625, -0.281005859375, 0.1591796875, 0.599365234375, 1.03955078125, 1.479736328125, 1.919921875, 2.360107421875, 2.80029296875, 3.240478515625, 3.6806640625, 4.120849609375, 4.56103515625, 5.001220703125, 5.44140625, 5.881591796875, 6.32177734375, 6.761962890625, 7.2021484375, 7.642333984375, 8.08251953125, 8.522705078125, 8.962890625, 9.403076171875, 9.84326171875, 10.283447265625, 10.7236328125, 11.163818359375, 11.60400390625, 12.044189453125, 12.484375]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 4.0, 2.0, 11.0, 8.0, 13.0, 18.0, 31.0, 64.0, 78.0, 125.0, 171.0, 296.0, 453.0, 611.0, 1011.0, 1528.0, 2489.0, 3766.0, 6053.0, 9641.0, 15366.0, 25308.0, 41255.0, 67680.0, 109192.0, 170836.0, 216263.0, 142470.0, 89579.0, 55354.0, 33533.0, 20693.0, 12650.0, 8029.0, 5071.0, 3124.0, 2032.0, 1274.0, 840.0, 580.0, 352.0, 242.0, 155.0, 99.0, 65.0, 47.0, 31.0, 23.0, 18.0, 12.0, 8.0, 5.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.31201171875, -0.3029136657714844, -0.29381561279296875, -0.2847175598144531, -0.2756195068359375, -0.2665214538574219, -0.25742340087890625, -0.24832534790039062, -0.239227294921875, -0.23012924194335938, -0.22103118896484375, -0.21193313598632812, -0.2028350830078125, -0.19373703002929688, -0.18463897705078125, -0.17554092407226562, -0.16644287109375, -0.15734481811523438, -0.14824676513671875, -0.13914871215820312, -0.1300506591796875, -0.12095260620117188, -0.11185455322265625, -0.10275650024414062, -0.093658447265625, -0.08456039428710938, -0.07546234130859375, -0.06636428833007812, -0.0572662353515625, -0.048168182373046875, -0.03907012939453125, -0.029972076416015625, -0.0208740234375, -0.011775970458984375, -0.00267791748046875, 0.006420135498046875, 0.0155181884765625, 0.024616241455078125, 0.03371429443359375, 0.042812347412109375, 0.051910400390625, 0.061008453369140625, 0.07010650634765625, 0.07920455932617188, 0.0883026123046875, 0.09740066528320312, 0.10649871826171875, 0.11559677124023438, 0.12469482421875, 0.13379287719726562, 0.14289093017578125, 0.15198898315429688, 0.1610870361328125, 0.17018508911132812, 0.17928314208984375, 0.18838119506835938, 0.197479248046875, 0.20657730102539062, 0.21567535400390625, 0.22477340698242188, 0.2338714599609375, 0.24296951293945312, 0.25206756591796875, 0.2611656188964844, 0.270263671875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 1.0, 4.0, 3.0, 5.0, 5.0, 8.0, 12.0, 14.0, 14.0, 14.0, 18.0, 20.0, 18.0, 15.0, 28.0, 28.0, 28.0, 34.0, 28.0, 31.0, 46.0, 37.0, 35.0, 36.0, 43.0, 1063.0, 28.0, 34.0, 37.0, 25.0, 34.0, 39.0, 29.0, 25.0, 25.0, 30.0, 20.0, 19.0, 17.0, 17.0, 13.0, 15.0, 7.0, 2.0, 8.0, 5.0, 5.0, 3.0, 0.0, 2.0, 5.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-9.6484375, -9.3492431640625, -9.050048828125, -8.7508544921875, -8.45166015625, -8.1524658203125, -7.853271484375, -7.5540771484375, -7.2548828125, -6.9556884765625, -6.656494140625, -6.3572998046875, -6.05810546875, -5.7589111328125, -5.459716796875, -5.1605224609375, -4.861328125, -4.5621337890625, -4.262939453125, -3.9637451171875, -3.66455078125, -3.3653564453125, -3.066162109375, -2.7669677734375, -2.4677734375, -2.1685791015625, -1.869384765625, -1.5701904296875, -1.27099609375, -0.9718017578125, -0.672607421875, -0.3734130859375, -0.07421875, 0.2249755859375, 0.524169921875, 0.8233642578125, 1.12255859375, 1.4217529296875, 1.720947265625, 2.0201416015625, 2.3193359375, 2.6185302734375, 2.917724609375, 3.2169189453125, 3.51611328125, 3.8153076171875, 4.114501953125, 4.4136962890625, 4.712890625, 5.0120849609375, 5.311279296875, 5.6104736328125, 5.90966796875, 6.2088623046875, 6.508056640625, 6.8072509765625, 7.1064453125, 7.4056396484375, 7.704833984375, 8.0040283203125, 8.30322265625, 8.6024169921875, 8.901611328125, 9.2008056640625, 9.5]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 4.0, 9.0, 17.0, 26.0, 44.0, 60.0, 80.0, 121.0, 174.0, 222.0, 344.0, 459.0, 669.0, 979.0, 1348.0, 1968.0, 2793.0, 4209.0, 6275.0, 9380.0, 14070.0, 21643.0, 33014.0, 51496.0, 80813.0, 133304.0, 1252117.0, 177618.0, 109312.0, 67486.0, 43410.0, 27872.0, 18331.0, 12229.0, 8118.0, 5278.0, 3718.0, 2455.0, 1744.0, 1191.0, 863.0, 556.0, 379.0, 274.0, 203.0, 138.0, 104.0, 73.0, 56.0, 31.0, 15.0, 20.0, 11.0, 9.0, 3.0, 2.0, 2.0, 1.0], "bins": [-0.1551513671875, -0.150421142578125, -0.14569091796875, -0.140960693359375, -0.13623046875, -0.131500244140625, -0.12677001953125, -0.122039794921875, -0.1173095703125, -0.112579345703125, -0.10784912109375, -0.103118896484375, -0.098388671875, -0.093658447265625, -0.08892822265625, -0.084197998046875, -0.0794677734375, -0.074737548828125, -0.07000732421875, -0.065277099609375, -0.060546875, -0.055816650390625, -0.05108642578125, -0.046356201171875, -0.0416259765625, -0.036895751953125, -0.03216552734375, -0.027435302734375, -0.022705078125, -0.017974853515625, -0.01324462890625, -0.008514404296875, -0.0037841796875, 0.000946044921875, 0.00567626953125, 0.010406494140625, 0.01513671875, 0.019866943359375, 0.02459716796875, 0.029327392578125, 0.0340576171875, 0.038787841796875, 0.04351806640625, 0.048248291015625, 0.052978515625, 0.057708740234375, 0.06243896484375, 0.067169189453125, 0.0718994140625, 0.076629638671875, 0.08135986328125, 0.086090087890625, 0.0908203125, 0.095550537109375, 0.10028076171875, 0.105010986328125, 0.1097412109375, 0.114471435546875, 0.11920166015625, 0.123931884765625, 0.128662109375, 0.133392333984375, 0.13812255859375, 0.142852783203125, 0.1475830078125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 6.0, 14.0, 11.0, 10.0, 15.0, 18.0, 20.0, 27.0, 35.0, 43.0, 51.0, 70.0, 53.0, 62.0, 76.0, 72.0, 79.0, 65.0, 50.0, 42.0, 43.0, 28.0, 19.0, 23.0, 15.0, 17.0, 8.0, 3.0, 2.0, 5.0, 2.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010423660278320312, -0.0010128617286682129, -0.0009833574295043945, -0.0009538531303405762, -0.0009243488311767578, -0.0008948445320129395, -0.0008653402328491211, -0.0008358359336853027, -0.0008063316345214844, -0.000776827335357666, -0.0007473230361938477, -0.0007178187370300293, -0.0006883144378662109, -0.0006588101387023926, -0.0006293058395385742, -0.0005998015403747559, -0.0005702972412109375, -0.0005407929420471191, -0.0005112886428833008, -0.0004817843437194824, -0.00045228004455566406, -0.0004227757453918457, -0.00039327144622802734, -0.000363767147064209, -0.0003342628479003906, -0.00030475854873657227, -0.0002752542495727539, -0.00024574995040893555, -0.0002162456512451172, -0.00018674135208129883, -0.00015723705291748047, -0.0001277327537536621, -9.822845458984375e-05, -6.872415542602539e-05, -3.921985626220703e-05, -9.715557098388672e-06, 1.9788742065429688e-05, 4.929304122924805e-05, 7.87973403930664e-05, 0.00010830163955688477, 0.00013780593872070312, 0.00016731023788452148, 0.00019681453704833984, 0.0002263188362121582, 0.00025582313537597656, 0.0002853274345397949, 0.0003148317337036133, 0.00034433603286743164, 0.00037384033203125, 0.00040334463119506836, 0.0004328489303588867, 0.0004623532295227051, 0.0004918575286865234, 0.0005213618278503418, 0.0005508661270141602, 0.0005803704261779785, 0.0006098747253417969, 0.0006393790245056152, 0.0006688833236694336, 0.000698387622833252, 0.0007278919219970703, 0.0007573962211608887, 0.000786900520324707, 0.0008164048194885254, 0.0008459091186523438]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 3.0, 4.0, 3.0, 3.0, 9.0, 16.0, 17.0, 23.0, 21.0, 39.0, 49.0, 55.0, 93.0, 169.0, 384.0, 2094.0, 1033817.0, 10620.0, 555.0, 196.0, 112.0, 71.0, 48.0, 32.0, 23.0, 21.0, 16.0, 8.0, 12.0, 13.0, 7.0, 7.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01959228515625, -0.018908977508544922, -0.018225669860839844, -0.017542362213134766, -0.016859054565429688, -0.01617574691772461, -0.015492439270019531, -0.014809131622314453, -0.014125823974609375, -0.013442516326904297, -0.012759208679199219, -0.01207590103149414, -0.011392593383789062, -0.010709285736083984, -0.010025978088378906, -0.009342670440673828, -0.00865936279296875, -0.007976055145263672, -0.007292747497558594, -0.006609439849853516, -0.0059261322021484375, -0.005242824554443359, -0.004559516906738281, -0.003876209259033203, -0.003192901611328125, -0.002509593963623047, -0.0018262863159179688, -0.0011429786682128906, -0.0004596710205078125, 0.00022363662719726562, 0.0009069442749023438, 0.0015902519226074219, 0.0022735595703125, 0.002956867218017578, 0.0036401748657226562, 0.004323482513427734, 0.0050067901611328125, 0.005690097808837891, 0.006373405456542969, 0.007056713104248047, 0.007740020751953125, 0.008423328399658203, 0.009106636047363281, 0.00978994369506836, 0.010473251342773438, 0.011156558990478516, 0.011839866638183594, 0.012523174285888672, 0.01320648193359375, 0.013889789581298828, 0.014573097229003906, 0.015256404876708984, 0.015939712524414062, 0.01662302017211914, 0.01730632781982422, 0.017989635467529297, 0.018672943115234375, 0.019356250762939453, 0.02003955841064453, 0.02072286605834961, 0.021406173706054688, 0.022089481353759766, 0.022772789001464844, 0.023456096649169922, 0.024139404296875]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 21.0, 994.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.027796540409326553, -0.02728552557528019, -0.026774512603878975, -0.02626349776983261, -0.025752484798431396, -0.025241469964385033, -0.024730456992983818, -0.024219442158937454, -0.02370842918753624, -0.023197414353489876, -0.02268640138208866, -0.022175386548042297, -0.021664373576641083, -0.02115335874259472, -0.020642345771193504, -0.02013133093714714, -0.019620317965745926, -0.019109303131699562, -0.018598290160298347, -0.018087275326251984, -0.01757626235485077, -0.017065247520804405, -0.01655423454940319, -0.016043219715356827, -0.015532204881310463, -0.015021190978586674, -0.014510177075862885, -0.013999163173139095, -0.013488149270415306, -0.012977135367691517, -0.012466121464967728, -0.011955106630921364, -0.011444094590842724, -0.010933080688118935, -0.010422066785395145, -0.009911052882671356, -0.009400038979947567, -0.008889025077223778, -0.008378010243177414, -0.0078669972717762, -0.007355982903391123, -0.006844969000667334, -0.006333955097943544, -0.005822940729558468, -0.005311926826834679, -0.0048009129241108894, -0.0042898990213871, -0.003778885118663311, -0.003267871215939522, -0.0027568573132157326, -0.0022458434104919434, -0.0017348292749375105, -0.0012238153722137213, -0.0007128014694899321, -0.0002017873339354992, 0.00030922656878829, 0.0008202404715120792, 0.0013312543742358685, 0.0018422683933749795, 0.0023532824125140905, 0.0028642963152378798, 0.003375310217961669, 0.003886324353516102, 0.004397338256239891, 0.00490835215896368]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 4.0, 9.0, 20.0, 20.0, 48.0, 35.0, 46.0, 70.0, 59.0, 57.0, 97.0, 95.0, 87.0, 54.0, 69.0, 55.0, 51.0, 39.0, 20.0, 31.0, 17.0, 9.0, 7.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010976195335388184, -0.0010590441524982452, -0.0010204687714576721, -0.000981893390417099, -0.0009433180093765259, -0.0009047426283359528, -0.0008661672472953796, -0.0008275918662548065, -0.0007890164852142334, -0.0007504411041736603, -0.0007118657231330872, -0.000673290342092514, -0.0006347149610519409, -0.0005961395800113678, -0.0005575641989707947, -0.0005189888179302216, -0.00048041343688964844, -0.0004418380558490753, -0.0004032626748085022, -0.0003646872937679291, -0.00032611191272735596, -0.00028753653168678284, -0.0002489611506462097, -0.0002103857696056366, -0.00017181038856506348, -0.00013323500752449036, -9.465962648391724e-05, -5.6084245443344116e-05, -1.7508864402770996e-05, 2.1066516637802124e-05, 5.9641897678375244e-05, 9.821727871894836e-05, 0.00013679265975952148, 0.0001753680408000946, 0.00021394342184066772, 0.00025251880288124084, 0.00029109418392181396, 0.0003296695649623871, 0.0003682449460029602, 0.0004068203270435333, 0.00044539570808410645, 0.00048397108912467957, 0.0005225464701652527, 0.0005611218512058258, 0.0005996972322463989, 0.000638272613286972, 0.0006768479943275452, 0.0007154233753681183, 0.0007539987564086914, 0.0007925741374492645, 0.0008311495184898376, 0.0008697248995304108, 0.0009083002805709839, 0.000946875661611557, 0.0009854510426521301, 0.0010240264236927032, 0.0010626018047332764, 0.0011011771857738495, 0.0011397525668144226, 0.0011783279478549957, 0.0012169033288955688, 0.001255478709936142, 0.001294054090976715, 0.0013326294720172882, 0.0013712048530578613]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 4.0, 5.0, 4.0, 8.0, 10.0, 16.0, 21.0, 17.0, 27.0, 27.0, 26.0, 36.0, 36.0, 35.0, 32.0, 36.0, 49.0, 41.0, 36.0, 48.0, 47.0, 40.0, 35.0, 40.0, 48.0, 39.0, 27.0, 30.0, 41.0, 26.0, 25.0, 11.0, 17.0, 13.0, 11.0, 6.0, 4.0, 6.0, 8.0, 4.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0], "bins": [-15.6875, -15.247314453125, -14.80712890625, -14.366943359375, -13.9267578125, -13.486572265625, -13.04638671875, -12.606201171875, -12.166015625, -11.725830078125, -11.28564453125, -10.845458984375, -10.4052734375, -9.965087890625, -9.52490234375, -9.084716796875, -8.64453125, -8.204345703125, -7.76416015625, -7.323974609375, -6.8837890625, -6.443603515625, -6.00341796875, -5.563232421875, -5.123046875, -4.682861328125, -4.24267578125, -3.802490234375, -3.3623046875, -2.922119140625, -2.48193359375, -2.041748046875, -1.6015625, -1.161376953125, -0.72119140625, -0.281005859375, 0.1591796875, 0.599365234375, 1.03955078125, 1.479736328125, 1.919921875, 2.360107421875, 2.80029296875, 3.240478515625, 3.6806640625, 4.120849609375, 4.56103515625, 5.001220703125, 5.44140625, 5.881591796875, 6.32177734375, 6.761962890625, 7.2021484375, 7.642333984375, 8.08251953125, 8.522705078125, 8.962890625, 9.403076171875, 9.84326171875, 10.283447265625, 10.7236328125, 11.163818359375, 11.60400390625, 12.044189453125, 12.484375]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 12.0, 12.0, 8.0, 24.0, 21.0, 32.0, 56.0, 75.0, 100.0, 174.0, 268.0, 451.0, 760.0, 1283.0, 2078.0, 3496.0, 6501.0, 13329.0, 67869.0, 842644.0, 79158.0, 14402.0, 6640.0, 3655.0, 2162.0, 1283.0, 775.0, 482.0, 283.0, 171.0, 96.0, 73.0, 47.0, 39.0, 22.0, 18.0, 8.0, 12.0, 8.0, 7.0, 6.0, 5.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-27.875, -27.01806640625, -26.1611328125, -25.30419921875, -24.447265625, -23.59033203125, -22.7333984375, -21.87646484375, -21.01953125, -20.16259765625, -19.3056640625, -18.44873046875, -17.591796875, -16.73486328125, -15.8779296875, -15.02099609375, -14.1640625, -13.30712890625, -12.4501953125, -11.59326171875, -10.736328125, -9.87939453125, -9.0224609375, -8.16552734375, -7.30859375, -6.45166015625, -5.5947265625, -4.73779296875, -3.880859375, -3.02392578125, -2.1669921875, -1.31005859375, -0.453125, 0.40380859375, 1.2607421875, 2.11767578125, 2.974609375, 3.83154296875, 4.6884765625, 5.54541015625, 6.40234375, 7.25927734375, 8.1162109375, 8.97314453125, 9.830078125, 10.68701171875, 11.5439453125, 12.40087890625, 13.2578125, 14.11474609375, 14.9716796875, 15.82861328125, 16.685546875, 17.54248046875, 18.3994140625, 19.25634765625, 20.11328125, 20.97021484375, 21.8271484375, 22.68408203125, 23.541015625, 24.39794921875, 25.2548828125, 26.11181640625, 26.96875]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 7.0, 3.0, 7.0, 12.0, 20.0, 14.0, 16.0, 17.0, 25.0, 24.0, 41.0, 28.0, 39.0, 48.0, 55.0, 69.0, 79.0, 487.0, 1585.0, 85.0, 58.0, 48.0, 42.0, 54.0, 33.0, 32.0, 27.0, 29.0, 13.0, 9.0, 14.0, 10.0, 8.0, 1.0, 7.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.5, -44.951171875, -43.40234375, -41.853515625, -40.3046875, -38.755859375, -37.20703125, -35.658203125, -34.109375, -32.560546875, -31.01171875, -29.462890625, -27.9140625, -26.365234375, -24.81640625, -23.267578125, -21.71875, -20.169921875, -18.62109375, -17.072265625, -15.5234375, -13.974609375, -12.42578125, -10.876953125, -9.328125, -7.779296875, -6.23046875, -4.681640625, -3.1328125, -1.583984375, -0.03515625, 1.513671875, 3.0625, 4.611328125, 6.16015625, 7.708984375, 9.2578125, 10.806640625, 12.35546875, 13.904296875, 15.453125, 17.001953125, 18.55078125, 20.099609375, 21.6484375, 23.197265625, 24.74609375, 26.294921875, 27.84375, 29.392578125, 30.94140625, 32.490234375, 34.0390625, 35.587890625, 37.13671875, 38.685546875, 40.234375, 41.783203125, 43.33203125, 44.880859375, 46.4296875, 47.978515625, 49.52734375, 51.076171875, 52.625]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 7.0, 3.0, 8.0, 16.0, 13.0, 17.0, 17.0, 29.0, 39.0, 43.0, 73.0, 107.0, 155.0, 434.0, 1715.0, 8807.0, 339904.0, 2779294.0, 11713.0, 2169.0, 508.0, 195.0, 107.0, 67.0, 59.0, 43.0, 32.0, 33.0, 18.0, 14.0, 14.0, 21.0, 12.0, 5.0, 7.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-86.5, -83.884765625, -81.26953125, -78.654296875, -76.0390625, -73.423828125, -70.80859375, -68.193359375, -65.578125, -62.962890625, -60.34765625, -57.732421875, -55.1171875, -52.501953125, -49.88671875, -47.271484375, -44.65625, -42.041015625, -39.42578125, -36.810546875, -34.1953125, -31.580078125, -28.96484375, -26.349609375, -23.734375, -21.119140625, -18.50390625, -15.888671875, -13.2734375, -10.658203125, -8.04296875, -5.427734375, -2.8125, -0.197265625, 2.41796875, 5.033203125, 7.6484375, 10.263671875, 12.87890625, 15.494140625, 18.109375, 20.724609375, 23.33984375, 25.955078125, 28.5703125, 31.185546875, 33.80078125, 36.416015625, 39.03125, 41.646484375, 44.26171875, 46.876953125, 49.4921875, 52.107421875, 54.72265625, 57.337890625, 59.953125, 62.568359375, 65.18359375, 67.798828125, 70.4140625, 73.029296875, 75.64453125, 78.259765625, 80.875]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 19.0, 228.0, 602.0, 151.0, 15.0, 0.0, 1.0, 0.0, 1.0], "bins": [-409.54376220703125, -402.4053955078125, -395.26702880859375, -388.128662109375, -380.99029541015625, -373.8519287109375, -366.71356201171875, -359.5751953125, -352.43682861328125, -345.2984619140625, -338.16009521484375, -331.021728515625, -323.88336181640625, -316.7449951171875, -309.60662841796875, -302.46826171875, -295.3298645019531, -288.1914978027344, -281.0531311035156, -273.9147644042969, -266.7763977050781, -259.6380310058594, -252.49964904785156, -245.3612823486328, -238.22291564941406, -231.0845489501953, -223.94618225097656, -216.8078155517578, -209.66943359375, -202.53106689453125, -195.3927001953125, -188.25433349609375, -181.115966796875, -173.97760009765625, -166.8392333984375, -159.70086669921875, -152.5625, -145.42413330078125, -138.28575134277344, -131.1473846435547, -124.00901794433594, -116.87065124511719, -109.73228454589844, -102.59391021728516, -95.4555435180664, -88.31717681884766, -81.17880249023438, -74.04043579101562, -66.90206909179688, -59.763702392578125, -52.62533187866211, -45.486961364746094, -38.348594665527344, -31.210227966308594, -24.071857452392578, -16.933486938476562, -9.795124053955078, -2.6567554473876953, 4.4816131591796875, 11.61998176574707, 18.758350372314453, 25.896717071533203, 33.03508758544922, 40.173458099365234, 47.311824798583984]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 6.0, 4.0, 8.0, 4.0, 7.0, 15.0, 8.0, 9.0, 12.0, 17.0, 16.0, 25.0, 19.0, 31.0, 26.0, 30.0, 27.0, 38.0, 42.0, 36.0, 47.0, 52.0, 54.0, 52.0, 34.0, 44.0, 39.0, 39.0, 36.0, 24.0, 35.0, 22.0, 20.0, 18.0, 16.0, 25.0, 13.0, 17.0, 11.0, 7.0, 7.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-114.6417236328125, -111.21849822998047, -107.79527282714844, -104.37203979492188, -100.94881439208984, -97.52558898925781, -94.10236358642578, -90.67913818359375, -87.25590515136719, -83.83267974853516, -80.40945434570312, -76.98622131347656, -73.56299591064453, -70.1397705078125, -66.71654510498047, -63.29331970214844, -59.870094299316406, -56.446868896484375, -53.02363967895508, -49.60041427612305, -46.17718505859375, -42.75395965576172, -39.33073425292969, -35.907508850097656, -32.48427963256836, -29.061052322387695, -25.63782501220703, -22.214599609375, -18.791372299194336, -15.368144989013672, -11.94491958618164, -8.521692276000977, -5.098457336425781, -1.6752305030822754, 1.7479963302612305, 5.171222686767578, 8.594449996948242, 12.017677307128906, 15.440902709960938, 18.8641300201416, 22.287357330322266, 25.71058464050293, 29.133811950683594, 32.557037353515625, 35.980262756347656, 39.40349197387695, 42.826717376708984, 46.24994659423828, 49.67317199707031, 53.096397399902344, 56.51962661743164, 59.94285202026367, 63.36608123779297, 66.789306640625, 70.21253204345703, 73.63575744628906, 77.05899047851562, 80.48221588134766, 83.90544128417969, 87.32867431640625, 90.75189971923828, 94.17512512207031, 97.59835052490234, 101.02157592773438, 104.4448013305664]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 6.0, 5.0, 3.0, 4.0, 9.0, 19.0, 18.0, 25.0, 24.0, 22.0, 39.0, 29.0, 33.0, 30.0, 34.0, 32.0, 51.0, 44.0, 42.0, 46.0, 53.0, 42.0, 40.0, 33.0, 46.0, 36.0, 29.0, 38.0, 35.0, 29.0, 22.0, 15.0, 16.0, 7.0, 11.0, 5.0, 8.0, 4.0, 9.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-16.25, -15.7802734375, -15.310546875, -14.8408203125, -14.37109375, -13.9013671875, -13.431640625, -12.9619140625, -12.4921875, -12.0224609375, -11.552734375, -11.0830078125, -10.61328125, -10.1435546875, -9.673828125, -9.2041015625, -8.734375, -8.2646484375, -7.794921875, -7.3251953125, -6.85546875, -6.3857421875, -5.916015625, -5.4462890625, -4.9765625, -4.5068359375, -4.037109375, -3.5673828125, -3.09765625, -2.6279296875, -2.158203125, -1.6884765625, -1.21875, -0.7490234375, -0.279296875, 0.1904296875, 0.66015625, 1.1298828125, 1.599609375, 2.0693359375, 2.5390625, 3.0087890625, 3.478515625, 3.9482421875, 4.41796875, 4.8876953125, 5.357421875, 5.8271484375, 6.296875, 6.7666015625, 7.236328125, 7.7060546875, 8.17578125, 8.6455078125, 9.115234375, 9.5849609375, 10.0546875, 10.5244140625, 10.994140625, 11.4638671875, 11.93359375, 12.4033203125, 12.873046875, 13.3427734375, 13.8125]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 7.0, 2.0, 2.0, 8.0, 12.0, 22.0, 26.0, 35.0, 39.0, 79.0, 126.0, 196.0, 348.0, 666.0, 1457.0, 3202.0, 7336.0, 18503.0, 62129.0, 600904.0, 3030853.0, 391512.0, 49195.0, 15962.0, 6419.0, 2653.0, 1208.0, 554.0, 321.0, 195.0, 105.0, 73.0, 38.0, 26.0, 12.0, 18.0, 9.0, 8.0, 4.0, 5.0, 5.0, 2.0, 3.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-35.4375, -34.407958984375, -33.37841796875, -32.348876953125, -31.3193359375, -30.289794921875, -29.26025390625, -28.230712890625, -27.201171875, -26.171630859375, -25.14208984375, -24.112548828125, -23.0830078125, -22.053466796875, -21.02392578125, -19.994384765625, -18.96484375, -17.935302734375, -16.90576171875, -15.876220703125, -14.8466796875, -13.817138671875, -12.78759765625, -11.758056640625, -10.728515625, -9.698974609375, -8.66943359375, -7.639892578125, -6.6103515625, -5.580810546875, -4.55126953125, -3.521728515625, -2.4921875, -1.462646484375, -0.43310546875, 0.596435546875, 1.6259765625, 2.655517578125, 3.68505859375, 4.714599609375, 5.744140625, 6.773681640625, 7.80322265625, 8.832763671875, 9.8623046875, 10.891845703125, 11.92138671875, 12.950927734375, 13.98046875, 15.010009765625, 16.03955078125, 17.069091796875, 18.0986328125, 19.128173828125, 20.15771484375, 21.187255859375, 22.216796875, 23.246337890625, 24.27587890625, 25.305419921875, 26.3349609375, 27.364501953125, 28.39404296875, 29.423583984375, 30.453125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 10.0, 6.0, 12.0, 19.0, 24.0, 44.0, 58.0, 87.0, 179.0, 357.0, 914.0, 1239.0, 578.0, 265.0, 121.0, 56.0, 28.0, 38.0, 14.0, 6.0, 12.0, 8.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.40625, -51.07080078125, -49.7353515625, -48.39990234375, -47.064453125, -45.72900390625, -44.3935546875, -43.05810546875, -41.72265625, -40.38720703125, -39.0517578125, -37.71630859375, -36.380859375, -35.04541015625, -33.7099609375, -32.37451171875, -31.0390625, -29.70361328125, -28.3681640625, -27.03271484375, -25.697265625, -24.36181640625, -23.0263671875, -21.69091796875, -20.35546875, -19.02001953125, -17.6845703125, -16.34912109375, -15.013671875, -13.67822265625, -12.3427734375, -11.00732421875, -9.671875, -8.33642578125, -7.0009765625, -5.66552734375, -4.330078125, -2.99462890625, -1.6591796875, -0.32373046875, 1.01171875, 2.34716796875, 3.6826171875, 5.01806640625, 6.353515625, 7.68896484375, 9.0244140625, 10.35986328125, 11.6953125, 13.03076171875, 14.3662109375, 15.70166015625, 17.037109375, 18.37255859375, 19.7080078125, 21.04345703125, 22.37890625, 23.71435546875, 25.0498046875, 26.38525390625, 27.720703125, 29.05615234375, 30.3916015625, 31.72705078125, 33.0625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 5.0, 10.0, 10.0, 16.0, 28.0, 67.0, 96.0, 263.0, 568.0, 2158.0, 16275.0, 559943.0, 3571722.0, 38117.0, 3546.0, 806.0, 332.0, 142.0, 72.0, 37.0, 38.0, 15.0, 4.0, 9.0, 3.0, 7.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.8125, -66.5126953125, -63.212890625, -59.9130859375, -56.61328125, -53.3134765625, -50.013671875, -46.7138671875, -43.4140625, -40.1142578125, -36.814453125, -33.5146484375, -30.21484375, -26.9150390625, -23.615234375, -20.3154296875, -17.015625, -13.7158203125, -10.416015625, -7.1162109375, -3.81640625, -0.5166015625, 2.783203125, 6.0830078125, 9.3828125, 12.6826171875, 15.982421875, 19.2822265625, 22.58203125, 25.8818359375, 29.181640625, 32.4814453125, 35.78125, 39.0810546875, 42.380859375, 45.6806640625, 48.98046875, 52.2802734375, 55.580078125, 58.8798828125, 62.1796875, 65.4794921875, 68.779296875, 72.0791015625, 75.37890625, 78.6787109375, 81.978515625, 85.2783203125, 88.578125, 91.8779296875, 95.177734375, 98.4775390625, 101.77734375, 105.0771484375, 108.376953125, 111.6767578125, 114.9765625, 118.2763671875, 121.576171875, 124.8759765625, 128.17578125, 131.4755859375, 134.775390625, 138.0751953125, 141.375]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 7.0, 14.0, 68.0, 183.0, 338.0, 259.0, 104.0, 23.0, 11.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-236.5100860595703, -227.67068481445312, -218.83128356933594, -209.99188232421875, -201.15248107910156, -192.31307983398438, -183.47369384765625, -174.63427734375, -165.79489135742188, -156.9554901123047, -148.1160888671875, -139.2766876220703, -130.43728637695312, -121.59788513183594, -112.75849151611328, -103.9190902709961, -95.07968139648438, -86.24028015136719, -77.40087890625, -68.56147766113281, -59.72208023071289, -50.8826789855957, -42.04328155517578, -33.203880310058594, -24.364479064941406, -15.525078773498535, -6.685678482055664, 2.1537208557128906, 10.993122100830078, 19.832523345947266, 28.671920776367188, 37.511322021484375, 46.350738525390625, 55.19013977050781, 64.029541015625, 72.86894226074219, 81.70834350585938, 90.54774475097656, 99.38713836669922, 108.2265396118164, 117.0659408569336, 125.90534210205078, 134.74473571777344, 143.58413696289062, 152.4235382080078, 161.262939453125, 170.1023406982422, 178.94174194335938, 187.78114318847656, 196.62054443359375, 205.45994567871094, 214.29934692382812, 223.1387481689453, 231.9781494140625, 240.81753540039062, 249.65695190429688, 258.496337890625, 267.3357238769531, 276.1751403808594, 285.0145263671875, 293.85394287109375, 302.6933288574219, 311.5327453613281, 320.37213134765625, 329.2115478515625]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 4.0, 8.0, 10.0, 9.0, 7.0, 15.0, 16.0, 24.0, 23.0, 29.0, 32.0, 32.0, 26.0, 39.0, 33.0, 45.0, 36.0, 44.0, 64.0, 47.0, 53.0, 44.0, 44.0, 46.0, 42.0, 38.0, 27.0, 23.0, 21.0, 23.0, 13.0, 9.0, 13.0, 11.0, 13.0, 6.0, 8.0, 5.0, 8.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.86015319824219, -84.16903686523438, -81.47792053222656, -78.78680419921875, -76.09568786621094, -73.40457153320312, -70.71345520019531, -68.02234649658203, -65.33123016357422, -62.640113830566406, -59.948997497558594, -57.25788116455078, -54.566768646240234, -51.87565231323242, -49.18453598022461, -46.49342346191406, -43.802303314208984, -41.11118698120117, -38.42007064819336, -35.72895812988281, -33.037841796875, -30.346725463867188, -27.655609130859375, -24.964494705200195, -22.273378372192383, -19.58226203918457, -16.89114761352539, -14.200031280517578, -11.508915901184082, -8.817800521850586, -6.126684188842773, -3.4355697631835938, -0.7444534301757812, 1.946662187576294, 4.637777805328369, 7.328893661499023, 10.02000904083252, 12.711124420166016, 15.402240753173828, 18.093355178833008, 20.78447151184082, 23.475587844848633, 26.166702270507812, 28.857818603515625, 31.548934936523438, 34.24005126953125, 36.93116760253906, 39.62228012084961, 42.31339645385742, 45.004512786865234, 47.69562911987305, 50.386741638183594, 53.077857971191406, 55.76897430419922, 58.46009063720703, 61.151206970214844, 63.842323303222656, 66.53343963623047, 69.22455596923828, 71.9156723022461, 74.6067886352539, 77.29789733886719, 79.989013671875, 82.68013000488281, 85.37124633789062]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 8.0, 4.0, 3.0, 8.0, 7.0, 9.0, 7.0, 18.0, 20.0, 12.0, 26.0, 15.0, 28.0, 23.0, 28.0, 41.0, 48.0, 36.0, 46.0, 44.0, 40.0, 51.0, 47.0, 47.0, 41.0, 38.0, 24.0, 31.0, 32.0, 37.0, 22.0, 31.0, 23.0, 28.0, 14.0, 15.0, 12.0, 7.0, 8.0, 8.0, 5.0, 6.0, 3.0, 4.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.6171875, -15.142333984375, -14.66748046875, -14.192626953125, -13.7177734375, -13.242919921875, -12.76806640625, -12.293212890625, -11.818359375, -11.343505859375, -10.86865234375, -10.393798828125, -9.9189453125, -9.444091796875, -8.96923828125, -8.494384765625, -8.01953125, -7.544677734375, -7.06982421875, -6.594970703125, -6.1201171875, -5.645263671875, -5.17041015625, -4.695556640625, -4.220703125, -3.745849609375, -3.27099609375, -2.796142578125, -2.3212890625, -1.846435546875, -1.37158203125, -0.896728515625, -0.421875, 0.052978515625, 0.52783203125, 1.002685546875, 1.4775390625, 1.952392578125, 2.42724609375, 2.902099609375, 3.376953125, 3.851806640625, 4.32666015625, 4.801513671875, 5.2763671875, 5.751220703125, 6.22607421875, 6.700927734375, 7.17578125, 7.650634765625, 8.12548828125, 8.600341796875, 9.0751953125, 9.550048828125, 10.02490234375, 10.499755859375, 10.974609375, 11.449462890625, 11.92431640625, 12.399169921875, 12.8740234375, 13.348876953125, 13.82373046875, 14.298583984375, 14.7734375]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 4.0, 4.0, 3.0, 5.0, 14.0, 26.0, 34.0, 49.0, 81.0, 90.0, 144.0, 205.0, 301.0, 392.0, 578.0, 774.0, 1100.0, 1631.0, 2299.0, 3372.0, 4837.0, 7355.0, 10752.0, 15642.0, 22850.0, 34038.0, 49726.0, 72827.0, 108253.0, 162610.0, 178455.0, 118871.0, 79991.0, 54474.0, 37246.0, 25333.0, 17239.0, 11485.0, 7981.0, 5412.0, 3644.0, 2532.0, 1692.0, 1283.0, 881.0, 677.0, 424.0, 299.0, 194.0, 137.0, 103.0, 62.0, 52.0, 28.0, 35.0, 17.0, 8.0, 6.0, 3.0, 5.0, 3.0, 3.0], "bins": [-0.247802734375, -0.24008750915527344, -0.23237228393554688, -0.2246570587158203, -0.21694183349609375, -0.2092266082763672, -0.20151138305664062, -0.19379615783691406, -0.1860809326171875, -0.17836570739746094, -0.17065048217773438, -0.1629352569580078, -0.15522003173828125, -0.1475048065185547, -0.13978958129882812, -0.13207435607910156, -0.124359130859375, -0.11664390563964844, -0.10892868041992188, -0.10121345520019531, -0.09349822998046875, -0.08578300476074219, -0.07806777954101562, -0.07035255432128906, -0.0626373291015625, -0.05492210388183594, -0.047206878662109375, -0.03949165344238281, -0.03177642822265625, -0.024061203002929688, -0.016345977783203125, -0.008630752563476562, -0.00091552734375, 0.0067996978759765625, 0.014514923095703125, 0.022230148315429688, 0.02994537353515625, 0.03766059875488281, 0.045375823974609375, 0.05309104919433594, 0.0608062744140625, 0.06852149963378906, 0.07623672485351562, 0.08395195007324219, 0.09166717529296875, 0.09938240051269531, 0.10709762573242188, 0.11481285095214844, 0.122528076171875, 0.13024330139160156, 0.13795852661132812, 0.1456737518310547, 0.15338897705078125, 0.1611042022705078, 0.16881942749023438, 0.17653465270996094, 0.1842498779296875, 0.19196510314941406, 0.19968032836914062, 0.2073955535888672, 0.21511077880859375, 0.2228260040283203, 0.23054122924804688, 0.23825645446777344, 0.2459716796875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 5.0, 7.0, 11.0, 8.0, 11.0, 12.0, 17.0, 25.0, 20.0, 23.0, 31.0, 26.0, 32.0, 46.0, 38.0, 48.0, 51.0, 37.0, 34.0, 1070.0, 41.0, 54.0, 40.0, 37.0, 40.0, 42.0, 33.0, 31.0, 21.0, 31.0, 19.0, 13.0, 21.0, 8.0, 12.0, 7.0, 10.0, 8.0, 3.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-14.1328125, -13.7530517578125, -13.373291015625, -12.9935302734375, -12.61376953125, -12.2340087890625, -11.854248046875, -11.4744873046875, -11.0947265625, -10.7149658203125, -10.335205078125, -9.9554443359375, -9.57568359375, -9.1959228515625, -8.816162109375, -8.4364013671875, -8.056640625, -7.6768798828125, -7.297119140625, -6.9173583984375, -6.53759765625, -6.1578369140625, -5.778076171875, -5.3983154296875, -5.0185546875, -4.6387939453125, -4.259033203125, -3.8792724609375, -3.49951171875, -3.1197509765625, -2.739990234375, -2.3602294921875, -1.98046875, -1.6007080078125, -1.220947265625, -0.8411865234375, -0.46142578125, -0.0816650390625, 0.298095703125, 0.6778564453125, 1.0576171875, 1.4373779296875, 1.817138671875, 2.1968994140625, 2.57666015625, 2.9564208984375, 3.336181640625, 3.7159423828125, 4.095703125, 4.4754638671875, 4.855224609375, 5.2349853515625, 5.61474609375, 5.9945068359375, 6.374267578125, 6.7540283203125, 7.1337890625, 7.5135498046875, 7.893310546875, 8.2730712890625, 8.65283203125, 9.0325927734375, 9.412353515625, 9.7921142578125, 10.171875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 7.0, 8.0, 7.0, 7.0, 15.0, 15.0, 35.0, 45.0, 83.0, 130.0, 238.0, 346.0, 573.0, 1062.0, 1704.0, 2788.0, 4731.0, 7675.0, 13309.0, 22927.0, 40266.0, 73250.0, 143613.0, 1320608.0, 219563.0, 109297.0, 57836.0, 32055.0, 18261.0, 10751.0, 6283.0, 3841.0, 2210.0, 1425.0, 859.0, 492.0, 319.0, 182.0, 101.0, 75.0, 51.0, 30.0, 18.0, 16.0, 8.0, 5.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.2265625, -0.21965599060058594, -0.21274948120117188, -0.2058429718017578, -0.19893646240234375, -0.1920299530029297, -0.18512344360351562, -0.17821693420410156, -0.1713104248046875, -0.16440391540527344, -0.15749740600585938, -0.1505908966064453, -0.14368438720703125, -0.1367778778076172, -0.12987136840820312, -0.12296485900878906, -0.116058349609375, -0.10915184020996094, -0.10224533081054688, -0.09533882141113281, -0.08843231201171875, -0.08152580261230469, -0.07461929321289062, -0.06771278381347656, -0.0608062744140625, -0.05389976501464844, -0.046993255615234375, -0.04008674621582031, -0.03318023681640625, -0.026273727416992188, -0.019367218017578125, -0.012460708618164062, -0.00555419921875, 0.0013523101806640625, 0.008258819580078125, 0.015165328979492188, 0.02207183837890625, 0.028978347778320312, 0.035884857177734375, 0.04279136657714844, 0.0496978759765625, 0.05660438537597656, 0.06351089477539062, 0.07041740417480469, 0.07732391357421875, 0.08423042297363281, 0.09113693237304688, 0.09804344177246094, 0.104949951171875, 0.11185646057128906, 0.11876296997070312, 0.1256694793701172, 0.13257598876953125, 0.1394824981689453, 0.14638900756835938, 0.15329551696777344, 0.1602020263671875, 0.16710853576660156, 0.17401504516601562, 0.1809215545654297, 0.18782806396484375, 0.1947345733642578, 0.20164108276367188, 0.20854759216308594, 0.2154541015625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 5.0, 5.0, 4.0, 5.0, 14.0, 14.0, 6.0, 20.0, 11.0, 20.0, 16.0, 17.0, 25.0, 30.0, 35.0, 44.0, 26.0, 27.0, 45.0, 42.0, 58.0, 51.0, 53.0, 46.0, 39.0, 52.0, 36.0, 30.0, 24.0, 30.0, 28.0, 18.0, 22.0, 21.0, 10.0, 18.0, 16.0, 7.0, 5.0, 8.0, 4.0, 3.0, 5.0, 3.0, 6.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003867149353027344, -0.00037195533514022827, -0.00035719573497772217, -0.00034243613481521606, -0.00032767653465270996, -0.00031291693449020386, -0.00029815733432769775, -0.00028339773416519165, -0.00026863813400268555, -0.00025387853384017944, -0.00023911893367767334, -0.00022435933351516724, -0.00020959973335266113, -0.00019484013319015503, -0.00018008053302764893, -0.00016532093286514282, -0.00015056133270263672, -0.00013580173254013062, -0.00012104213237762451, -0.00010628253221511841, -9.15229320526123e-05, -7.67633318901062e-05, -6.20037317276001e-05, -4.7244131565093994e-05, -3.248453140258789e-05, -1.7724931240081787e-05, -2.9653310775756836e-06, 1.179426908493042e-05, 2.6553869247436523e-05, 4.131346940994263e-05, 5.607306957244873e-05, 7.083266973495483e-05, 8.559226989746094e-05, 0.00010035187005996704, 0.00011511147022247314, 0.00012987107038497925, 0.00014463067054748535, 0.00015939027070999146, 0.00017414987087249756, 0.00018890947103500366, 0.00020366907119750977, 0.00021842867136001587, 0.00023318827152252197, 0.0002479478716850281, 0.0002627074718475342, 0.0002774670720100403, 0.0002922266721725464, 0.0003069862723350525, 0.0003217458724975586, 0.0003365054726600647, 0.0003512650728225708, 0.0003660246729850769, 0.000380784273147583, 0.0003955438733100891, 0.0004103034734725952, 0.0004250630736351013, 0.0004398226737976074, 0.0004545822739601135, 0.00046934187412261963, 0.00048410147428512573, 0.0004988610744476318, 0.0005136206746101379, 0.000528380274772644, 0.0005431398749351501, 0.0005578994750976562]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 6.0, 0.0, 6.0, 4.0, 4.0, 6.0, 7.0, 9.0, 11.0, 15.0, 18.0, 22.0, 17.0, 26.0, 34.0, 33.0, 41.0, 68.0, 102.0, 181.0, 303.0, 863.0, 20004.0, 1019707.0, 5481.0, 678.0, 315.0, 130.0, 87.0, 69.0, 68.0, 40.0, 43.0, 28.0, 15.0, 21.0, 15.0, 14.0, 15.0, 6.0, 10.0, 16.0, 4.0, 4.0, 6.0, 4.0, 4.0, 1.0, 3.0, 1.0], "bins": [-0.0124359130859375, -0.01210319995880127, -0.011770486831665039, -0.011437773704528809, -0.011105060577392578, -0.010772347450256348, -0.010439634323120117, -0.010106921195983887, -0.009774208068847656, -0.009441494941711426, -0.009108781814575195, -0.008776068687438965, -0.008443355560302734, -0.008110642433166504, -0.0077779293060302734, -0.007445216178894043, -0.0071125030517578125, -0.006779789924621582, -0.0064470767974853516, -0.006114363670349121, -0.005781650543212891, -0.00544893741607666, -0.00511622428894043, -0.004783511161804199, -0.004450798034667969, -0.004118084907531738, -0.003785371780395508, -0.0034526586532592773, -0.003119945526123047, -0.0027872323989868164, -0.002454519271850586, -0.0021218061447143555, -0.001789093017578125, -0.0014563798904418945, -0.001123666763305664, -0.0007909536361694336, -0.0004582405090332031, -0.00012552738189697266, 0.0002071857452392578, 0.0005398988723754883, 0.0008726119995117188, 0.0012053251266479492, 0.0015380382537841797, 0.0018707513809204102, 0.0022034645080566406, 0.002536177635192871, 0.0028688907623291016, 0.003201603889465332, 0.0035343170166015625, 0.003867030143737793, 0.0041997432708740234, 0.004532456398010254, 0.004865169525146484, 0.005197882652282715, 0.005530595779418945, 0.005863308906555176, 0.006196022033691406, 0.006528735160827637, 0.006861448287963867, 0.007194161415100098, 0.007526874542236328, 0.007859587669372559, 0.008192300796508789, 0.00852501392364502, 0.00885772705078125]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 371.0, 641.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.011258742772042751, -0.011014152318239212, -0.010769560933113098, -0.010524969547986984, -0.010280379094183445, -0.010035788640379906, -0.009791197255253792, -0.009546605870127678, -0.009302015416324139, -0.0090574249625206, -0.008812833577394485, -0.008568242192268372, -0.008323651738464832, -0.008079061284661293, -0.00783446989953518, -0.0075898789800703526, -0.007345288060605526, -0.007100697141140699, -0.006856106221675873, -0.006611515302211046, -0.00636692438274622, -0.006122333463281393, -0.0058777425438165665, -0.00563315162435174, -0.005388560704886913, -0.005143969785422087, -0.00489937886595726, -0.0046547879464924335, -0.004410197027027607, -0.00416560610756278, -0.003921015188097954, -0.003676424268633127, -0.0034318342804908752, -0.0031872433610260487, -0.002942652441561222, -0.0026980615220963955, -0.002453470602631569, -0.0022088796831667423, -0.0019642887637019157, -0.0017196978442370892, -0.0014751069247722626, -0.001230516005307436, -0.0009859250858426094, -0.0007413341663777828, -0.0004967432469129562, -0.00025215232744812965, -7.56140798330307e-06, 0.00023702951148152351, 0.0004816204309463501, 0.0007262113504111767, 0.0009708022698760033, 0.0012153931893408298, 0.0014599841088056564, 0.001704575028270483, 0.0019491659477353096, 0.002193756867200136, 0.0024383477866649628, 0.0026829387061297894, 0.002927529625594616, 0.0031721205450594425, 0.003416711464524269, 0.0036613023839890957, 0.0039058933034539223, 0.004150484222918749, 0.0043950751423835754]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 6.0, 17.0, 32.0, 35.0, 48.0, 63.0, 81.0, 103.0, 116.0, 107.0, 86.0, 84.0, 74.0, 44.0, 36.0, 28.0, 22.0, 11.0, 8.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000894010066986084, -0.00086224265396595, -0.000830475240945816, -0.0007987078279256821, -0.0007669404149055481, -0.0007351730018854141, -0.0007034055888652802, -0.0006716381758451462, -0.0006398707628250122, -0.0006081033498048782, -0.0005763359367847443, -0.0005445685237646103, -0.0005128011107444763, -0.00048103369772434235, -0.0004492662847042084, -0.0004174988716840744, -0.00038573145866394043, -0.00035396404564380646, -0.0003221966326236725, -0.0002904292196035385, -0.00025866180658340454, -0.00022689439356327057, -0.0001951269805431366, -0.00016335956752300262, -0.00013159215450286865, -9.982474148273468e-05, -6.805732846260071e-05, -3.6289915442466736e-05, -4.522502422332764e-06, 2.724491059780121e-05, 5.901232361793518e-05, 9.077973663806915e-05, 0.00012254714965820312, 0.0001543145626783371, 0.00018608197569847107, 0.00021784938871860504, 0.000249616801738739, 0.000281384214758873, 0.00031315162777900696, 0.00034491904079914093, 0.0003766864538192749, 0.0004084538668394089, 0.00044022127985954285, 0.0004719886928796768, 0.0005037561058998108, 0.0005355235189199448, 0.0005672909319400787, 0.0005990583449602127, 0.0006308257579803467, 0.0006625931710004807, 0.0006943605840206146, 0.0007261279970407486, 0.0007578954100608826, 0.0007896628230810165, 0.0008214302361011505, 0.0008531976491212845, 0.0008849650621414185, 0.0009167324751615524, 0.0009484998881816864, 0.0009802673012018204, 0.0010120347142219543, 0.0010438021272420883, 0.0010755695402622223, 0.0011073369532823563, 0.0011391043663024902]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 8.0, 4.0, 3.0, 8.0, 7.0, 9.0, 7.0, 18.0, 20.0, 12.0, 26.0, 15.0, 28.0, 23.0, 28.0, 41.0, 48.0, 36.0, 46.0, 44.0, 40.0, 51.0, 47.0, 47.0, 41.0, 38.0, 24.0, 31.0, 32.0, 37.0, 22.0, 31.0, 23.0, 28.0, 14.0, 15.0, 12.0, 7.0, 8.0, 8.0, 5.0, 6.0, 3.0, 4.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.6171875, -15.142333984375, -14.66748046875, -14.192626953125, -13.7177734375, -13.242919921875, -12.76806640625, -12.293212890625, -11.818359375, -11.343505859375, -10.86865234375, -10.393798828125, -9.9189453125, -9.444091796875, -8.96923828125, -8.494384765625, -8.01953125, -7.544677734375, -7.06982421875, -6.594970703125, -6.1201171875, -5.645263671875, -5.17041015625, -4.695556640625, -4.220703125, -3.745849609375, -3.27099609375, -2.796142578125, -2.3212890625, -1.846435546875, -1.37158203125, -0.896728515625, -0.421875, 0.052978515625, 0.52783203125, 1.002685546875, 1.4775390625, 1.952392578125, 2.42724609375, 2.902099609375, 3.376953125, 3.851806640625, 4.32666015625, 4.801513671875, 5.2763671875, 5.751220703125, 6.22607421875, 6.700927734375, 7.17578125, 7.650634765625, 8.12548828125, 8.600341796875, 9.0751953125, 9.550048828125, 10.02490234375, 10.499755859375, 10.974609375, 11.449462890625, 11.92431640625, 12.399169921875, 12.8740234375, 13.348876953125, 13.82373046875, 14.298583984375, 14.7734375]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 7.0, 10.0, 14.0, 21.0, 16.0, 32.0, 31.0, 53.0, 78.0, 100.0, 136.0, 187.0, 293.0, 444.0, 683.0, 1071.0, 1834.0, 3074.0, 5362.0, 9188.0, 17119.0, 46504.0, 736559.0, 168389.0, 27006.0, 12746.0, 7052.0, 4042.0, 2417.0, 1438.0, 879.0, 542.0, 387.0, 227.0, 150.0, 117.0, 72.0, 67.0, 52.0, 31.0, 20.0, 21.0, 19.0, 16.0, 15.0, 13.0, 6.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-28.234375, -27.372802734375, -26.51123046875, -25.649658203125, -24.7880859375, -23.926513671875, -23.06494140625, -22.203369140625, -21.341796875, -20.480224609375, -19.61865234375, -18.757080078125, -17.8955078125, -17.033935546875, -16.17236328125, -15.310791015625, -14.44921875, -13.587646484375, -12.72607421875, -11.864501953125, -11.0029296875, -10.141357421875, -9.27978515625, -8.418212890625, -7.556640625, -6.695068359375, -5.83349609375, -4.971923828125, -4.1103515625, -3.248779296875, -2.38720703125, -1.525634765625, -0.6640625, 0.197509765625, 1.05908203125, 1.920654296875, 2.7822265625, 3.643798828125, 4.50537109375, 5.366943359375, 6.228515625, 7.090087890625, 7.95166015625, 8.813232421875, 9.6748046875, 10.536376953125, 11.39794921875, 12.259521484375, 13.12109375, 13.982666015625, 14.84423828125, 15.705810546875, 16.5673828125, 17.428955078125, 18.29052734375, 19.152099609375, 20.013671875, 20.875244140625, 21.73681640625, 22.598388671875, 23.4599609375, 24.321533203125, 25.18310546875, 26.044677734375, 26.90625]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 3.0, 4.0, 4.0, 4.0, 7.0, 6.0, 5.0, 4.0, 9.0, 17.0, 19.0, 21.0, 31.0, 24.0, 29.0, 38.0, 35.0, 44.0, 36.0, 46.0, 67.0, 103.0, 1743.0, 264.0, 80.0, 59.0, 43.0, 46.0, 37.0, 35.0, 28.0, 28.0, 18.0, 23.0, 10.0, 15.0, 16.0, 9.0, 11.0, 10.0, 5.0, 6.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.34375, -36.04638671875, -34.7490234375, -33.45166015625, -32.154296875, -30.85693359375, -29.5595703125, -28.26220703125, -26.96484375, -25.66748046875, -24.3701171875, -23.07275390625, -21.775390625, -20.47802734375, -19.1806640625, -17.88330078125, -16.5859375, -15.28857421875, -13.9912109375, -12.69384765625, -11.396484375, -10.09912109375, -8.8017578125, -7.50439453125, -6.20703125, -4.90966796875, -3.6123046875, -2.31494140625, -1.017578125, 0.27978515625, 1.5771484375, 2.87451171875, 4.171875, 5.46923828125, 6.7666015625, 8.06396484375, 9.361328125, 10.65869140625, 11.9560546875, 13.25341796875, 14.55078125, 15.84814453125, 17.1455078125, 18.44287109375, 19.740234375, 21.03759765625, 22.3349609375, 23.63232421875, 24.9296875, 26.22705078125, 27.5244140625, 28.82177734375, 30.119140625, 31.41650390625, 32.7138671875, 34.01123046875, 35.30859375, 36.60595703125, 37.9033203125, 39.20068359375, 40.498046875, 41.79541015625, 43.0927734375, 44.39013671875, 45.6875]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 5.0, 9.0, 5.0, 9.0, 14.0, 14.0, 22.0, 16.0, 29.0, 22.0, 47.0, 83.0, 103.0, 179.0, 376.0, 1167.0, 4473.0, 25157.0, 2948441.0, 149995.0, 11471.0, 2518.0, 724.0, 316.0, 149.0, 94.0, 56.0, 41.0, 40.0, 26.0, 29.0, 19.0, 10.0, 9.0, 8.0, 8.0, 6.0, 1.0, 6.0, 4.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.0, -78.5302734375, -76.060546875, -73.5908203125, -71.12109375, -68.6513671875, -66.181640625, -63.7119140625, -61.2421875, -58.7724609375, -56.302734375, -53.8330078125, -51.36328125, -48.8935546875, -46.423828125, -43.9541015625, -41.484375, -39.0146484375, -36.544921875, -34.0751953125, -31.60546875, -29.1357421875, -26.666015625, -24.1962890625, -21.7265625, -19.2568359375, -16.787109375, -14.3173828125, -11.84765625, -9.3779296875, -6.908203125, -4.4384765625, -1.96875, 0.5009765625, 2.970703125, 5.4404296875, 7.91015625, 10.3798828125, 12.849609375, 15.3193359375, 17.7890625, 20.2587890625, 22.728515625, 25.1982421875, 27.66796875, 30.1376953125, 32.607421875, 35.0771484375, 37.546875, 40.0166015625, 42.486328125, 44.9560546875, 47.42578125, 49.8955078125, 52.365234375, 54.8349609375, 57.3046875, 59.7744140625, 62.244140625, 64.7138671875, 67.18359375, 69.6533203125, 72.123046875, 74.5927734375, 77.0625]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 13.0, 59.0, 187.0, 363.0, 280.0, 71.0, 30.0, 6.0, 0.0, 2.0], "bins": [-248.97499084472656, -244.65927124023438, -240.34356689453125, -236.02784729003906, -231.71212768554688, -227.3964080810547, -223.0806884765625, -218.76498413085938, -214.4492645263672, -210.133544921875, -205.81784057617188, -201.5021209716797, -197.1864013671875, -192.8706817626953, -188.55496215820312, -184.2392578125, -179.9235382080078, -175.60781860351562, -171.2921142578125, -166.9763946533203, -162.66067504882812, -158.34495544433594, -154.02923583984375, -149.71353149414062, -145.39781188964844, -141.08209228515625, -136.76638793945312, -132.45066833496094, -128.13494873046875, -123.81922912597656, -119.5035171508789, -115.18780517578125, -110.87207794189453, -106.55636596679688, -102.24064636230469, -97.9249267578125, -93.60921478271484, -89.29350280761719, -84.977783203125, -80.66206359863281, -76.34635162353516, -72.0306396484375, -67.71492004394531, -63.39920425415039, -59.08348846435547, -54.76777267456055, -50.452056884765625, -46.1363410949707, -41.82062530517578, -37.50490951538086, -33.18919372558594, -28.873477935791016, -24.557762145996094, -20.242046356201172, -15.92633056640625, -11.610614776611328, -7.294897079467773, -2.9791812896728516, 1.3365345001220703, 5.652250289916992, 9.967966079711914, 14.283681869506836, 18.599397659301758, 22.91511344909668, 27.2308292388916]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 5.0, 10.0, 9.0, 10.0, 7.0, 9.0, 19.0, 20.0, 27.0, 21.0, 34.0, 23.0, 26.0, 34.0, 30.0, 26.0, 34.0, 33.0, 34.0, 21.0, 40.0, 46.0, 32.0, 42.0, 37.0, 39.0, 37.0, 42.0, 20.0, 37.0, 20.0, 22.0, 13.0, 25.0, 22.0, 19.0, 19.0, 8.0, 8.0, 7.0, 12.0, 3.0, 4.0, 5.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-95.50756072998047, -92.47132110595703, -89.43508911132812, -86.39884948730469, -83.36260986328125, -80.32637786865234, -77.2901382446289, -74.25390625, -71.21766662597656, -68.18142700195312, -65.14519500732422, -62.10895538330078, -59.07271957397461, -56.03648376464844, -53.000244140625, -49.96400833129883, -46.927772521972656, -43.891536712646484, -40.85530090332031, -37.819061279296875, -34.7828254699707, -31.74658966064453, -28.710351943969727, -25.674114227294922, -22.63787841796875, -19.601642608642578, -16.565404891967773, -13.529168128967285, -10.492931365966797, -7.456694602966309, -4.42045783996582, -1.3842201232910156, 1.6520156860351562, 4.6882524490356445, 7.724489212036133, 10.760725975036621, 13.79696273803711, 16.83319854736328, 19.869436264038086, 22.90567398071289, 25.941909790039062, 28.978145599365234, 32.014381408691406, 35.050621032714844, 38.086856842041016, 41.12309265136719, 44.159332275390625, 47.1955680847168, 50.23180389404297, 53.26803970336914, 56.30427551269531, 59.34051513671875, 62.37675094604492, 65.4129867553711, 68.44922637939453, 71.48545837402344, 74.52169799804688, 77.55793762207031, 80.59416961669922, 83.63040924072266, 86.66664123535156, 89.702880859375, 92.73912048339844, 95.77536010742188, 98.81159210205078]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 6.0, 6.0, 6.0, 10.0, 7.0, 5.0, 15.0, 14.0, 13.0, 17.0, 20.0, 21.0, 23.0, 25.0, 33.0, 36.0, 43.0, 36.0, 44.0, 39.0, 39.0, 50.0, 43.0, 35.0, 47.0, 31.0, 46.0, 28.0, 34.0, 23.0, 26.0, 30.0, 28.0, 19.0, 16.0, 21.0, 12.0, 12.0, 17.0, 5.0, 5.0, 1.0, 4.0, 6.0, 5.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-15.5625, -15.1065673828125, -14.650634765625, -14.1947021484375, -13.73876953125, -13.2828369140625, -12.826904296875, -12.3709716796875, -11.9150390625, -11.4591064453125, -11.003173828125, -10.5472412109375, -10.09130859375, -9.6353759765625, -9.179443359375, -8.7235107421875, -8.267578125, -7.8116455078125, -7.355712890625, -6.8997802734375, -6.44384765625, -5.9879150390625, -5.531982421875, -5.0760498046875, -4.6201171875, -4.1641845703125, -3.708251953125, -3.2523193359375, -2.79638671875, -2.3404541015625, -1.884521484375, -1.4285888671875, -0.97265625, -0.5167236328125, -0.060791015625, 0.3951416015625, 0.85107421875, 1.3070068359375, 1.762939453125, 2.2188720703125, 2.6748046875, 3.1307373046875, 3.586669921875, 4.0426025390625, 4.49853515625, 4.9544677734375, 5.410400390625, 5.8663330078125, 6.322265625, 6.7781982421875, 7.234130859375, 7.6900634765625, 8.14599609375, 8.6019287109375, 9.057861328125, 9.5137939453125, 9.9697265625, 10.4256591796875, 10.881591796875, 11.3375244140625, 11.79345703125, 12.2493896484375, 12.705322265625, 13.1612548828125, 13.6171875]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 4.0, 9.0, 12.0, 11.0, 25.0, 23.0, 56.0, 88.0, 106.0, 184.0, 233.0, 360.0, 572.0, 912.0, 1450.0, 2511.0, 4019.0, 7185.0, 13519.0, 28219.0, 84484.0, 560835.0, 2619622.0, 704915.0, 100268.0, 31359.0, 14406.0, 7567.0, 4508.0, 2574.0, 1593.0, 988.0, 589.0, 365.0, 250.0, 145.0, 102.0, 59.0, 45.0, 32.0, 24.0, 10.0, 10.0, 13.0, 7.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-27.65625, -26.83203125, -26.0078125, -25.18359375, -24.359375, -23.53515625, -22.7109375, -21.88671875, -21.0625, -20.23828125, -19.4140625, -18.58984375, -17.765625, -16.94140625, -16.1171875, -15.29296875, -14.46875, -13.64453125, -12.8203125, -11.99609375, -11.171875, -10.34765625, -9.5234375, -8.69921875, -7.875, -7.05078125, -6.2265625, -5.40234375, -4.578125, -3.75390625, -2.9296875, -2.10546875, -1.28125, -0.45703125, 0.3671875, 1.19140625, 2.015625, 2.83984375, 3.6640625, 4.48828125, 5.3125, 6.13671875, 6.9609375, 7.78515625, 8.609375, 9.43359375, 10.2578125, 11.08203125, 11.90625, 12.73046875, 13.5546875, 14.37890625, 15.203125, 16.02734375, 16.8515625, 17.67578125, 18.5, 19.32421875, 20.1484375, 20.97265625, 21.796875, 22.62109375, 23.4453125, 24.26953125, 25.09375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 11.0, 10.0, 14.0, 10.0, 16.0, 26.0, 46.0, 50.0, 76.0, 124.0, 160.0, 316.0, 633.0, 957.0, 694.0, 372.0, 176.0, 109.0, 80.0, 55.0, 40.0, 20.0, 21.0, 14.0, 19.0, 10.0, 5.0, 7.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.0, -35.98876953125, -34.9775390625, -33.96630859375, -32.955078125, -31.94384765625, -30.9326171875, -29.92138671875, -28.91015625, -27.89892578125, -26.8876953125, -25.87646484375, -24.865234375, -23.85400390625, -22.8427734375, -21.83154296875, -20.8203125, -19.80908203125, -18.7978515625, -17.78662109375, -16.775390625, -15.76416015625, -14.7529296875, -13.74169921875, -12.73046875, -11.71923828125, -10.7080078125, -9.69677734375, -8.685546875, -7.67431640625, -6.6630859375, -5.65185546875, -4.640625, -3.62939453125, -2.6181640625, -1.60693359375, -0.595703125, 0.41552734375, 1.4267578125, 2.43798828125, 3.44921875, 4.46044921875, 5.4716796875, 6.48291015625, 7.494140625, 8.50537109375, 9.5166015625, 10.52783203125, 11.5390625, 12.55029296875, 13.5615234375, 14.57275390625, 15.583984375, 16.59521484375, 17.6064453125, 18.61767578125, 19.62890625, 20.64013671875, 21.6513671875, 22.66259765625, 23.673828125, 24.68505859375, 25.6962890625, 26.70751953125, 27.71875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 5.0, 6.0, 4.0, 13.0, 16.0, 19.0, 19.0, 35.0, 58.0, 103.0, 171.0, 317.0, 790.0, 2730.0, 13124.0, 99106.0, 3537007.0, 497216.0, 35176.0, 5812.0, 1429.0, 522.0, 244.0, 134.0, 91.0, 43.0, 26.0, 20.0, 14.0, 16.0, 8.0, 10.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.4375, -62.9921875, -60.546875, -58.1015625, -55.65625, -53.2109375, -50.765625, -48.3203125, -45.875, -43.4296875, -40.984375, -38.5390625, -36.09375, -33.6484375, -31.203125, -28.7578125, -26.3125, -23.8671875, -21.421875, -18.9765625, -16.53125, -14.0859375, -11.640625, -9.1953125, -6.75, -4.3046875, -1.859375, 0.5859375, 3.03125, 5.4765625, 7.921875, 10.3671875, 12.8125, 15.2578125, 17.703125, 20.1484375, 22.59375, 25.0390625, 27.484375, 29.9296875, 32.375, 34.8203125, 37.265625, 39.7109375, 42.15625, 44.6015625, 47.046875, 49.4921875, 51.9375, 54.3828125, 56.828125, 59.2734375, 61.71875, 64.1640625, 66.609375, 69.0546875, 71.5, 73.9453125, 76.390625, 78.8359375, 81.28125, 83.7265625, 86.171875, 88.6171875, 91.0625]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 7.0, 32.0, 64.0, 168.0, 274.0, 247.0, 149.0, 43.0, 20.0, 8.0, 1.0], "bins": [-459.6931457519531, -451.7401428222656, -443.7871398925781, -435.8341064453125, -427.881103515625, -419.9281005859375, -411.97509765625, -404.0220947265625, -396.0690612792969, -388.1160583496094, -380.1630554199219, -372.21002197265625, -364.25701904296875, -356.30401611328125, -348.35101318359375, -340.39801025390625, -332.44500732421875, -324.49200439453125, -316.53900146484375, -308.5859680175781, -300.6329650878906, -292.6799621582031, -284.7269592285156, -276.7739562988281, -268.8209228515625, -260.867919921875, -252.91490173339844, -244.96189880371094, -237.00888061523438, -229.05587768554688, -221.10287475585938, -213.1498565673828, -205.1968536376953, -197.2438507080078, -189.29083251953125, -181.33782958984375, -173.3848114013672, -165.4318084716797, -157.47879028320312, -149.52578735351562, -141.57278442382812, -133.61978149414062, -125.66676330566406, -117.71376037597656, -109.76074981689453, -101.8077392578125, -93.85472869873047, -85.90171813964844, -77.9487075805664, -69.99569702148438, -62.04269027709961, -54.08967971801758, -46.13667297363281, -38.18366241455078, -30.23065185546875, -22.277645111083984, -14.324634552001953, -6.3716254234313965, 1.5813837051391602, 9.534393310546875, 17.487401962280273, 25.440410614013672, 33.3934211730957, 41.34642791748047, 49.2994384765625]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 9.0, 5.0, 7.0, 6.0, 15.0, 16.0, 8.0, 14.0, 17.0, 12.0, 25.0, 19.0, 20.0, 27.0, 36.0, 27.0, 44.0, 44.0, 36.0, 29.0, 35.0, 35.0, 45.0, 42.0, 37.0, 36.0, 37.0, 39.0, 27.0, 34.0, 36.0, 19.0, 21.0, 24.0, 23.0, 17.0, 10.0, 9.0, 15.0, 11.0, 7.0, 6.0, 4.0, 4.0, 4.0, 6.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.98035430908203, -59.78236389160156, -57.58437728881836, -55.386390686035156, -53.18840026855469, -50.99040985107422, -48.792423248291016, -46.59443664550781, -44.396446228027344, -42.198455810546875, -40.00046920776367, -37.80248260498047, -35.6044921875, -33.40650177001953, -31.208515167236328, -29.010526657104492, -26.812538146972656, -24.61454963684082, -22.416561126708984, -20.21857261657715, -18.020584106445312, -15.822595596313477, -13.62460708618164, -11.426618576049805, -9.228630065917969, -7.030641555786133, -4.832653045654297, -2.634664535522461, -0.436676025390625, 1.761312484741211, 3.959300994873047, 6.157289505004883, 8.355270385742188, 10.553258895874023, 12.75124740600586, 14.949235916137695, 17.14722442626953, 19.345212936401367, 21.543201446533203, 23.74118995666504, 25.939178466796875, 28.13716697692871, 30.335155487060547, 32.53314208984375, 34.73113250732422, 36.92912292480469, 39.12710952758789, 41.325096130371094, 43.52308654785156, 45.72107696533203, 47.919063568115234, 50.11705017089844, 52.315040588378906, 54.513031005859375, 56.71101760864258, 58.90900421142578, 61.10699462890625, 63.30498504638672, 65.50297546386719, 67.70095825195312, 69.8989486694336, 72.09693908691406, 74.294921875, 76.49291229248047, 78.69090270996094]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 8.0, 3.0, 5.0, 10.0, 9.0, 21.0, 19.0, 22.0, 25.0, 39.0, 27.0, 38.0, 41.0, 33.0, 45.0, 50.0, 38.0, 45.0, 46.0, 31.0, 49.0, 44.0, 39.0, 42.0, 44.0, 38.0, 32.0, 18.0, 27.0, 24.0, 24.0, 21.0, 13.0, 6.0, 8.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.890625, -17.357666015625, -16.82470703125, -16.291748046875, -15.7587890625, -15.225830078125, -14.69287109375, -14.159912109375, -13.626953125, -13.093994140625, -12.56103515625, -12.028076171875, -11.4951171875, -10.962158203125, -10.42919921875, -9.896240234375, -9.36328125, -8.830322265625, -8.29736328125, -7.764404296875, -7.2314453125, -6.698486328125, -6.16552734375, -5.632568359375, -5.099609375, -4.566650390625, -4.03369140625, -3.500732421875, -2.9677734375, -2.434814453125, -1.90185546875, -1.368896484375, -0.8359375, -0.302978515625, 0.22998046875, 0.762939453125, 1.2958984375, 1.828857421875, 2.36181640625, 2.894775390625, 3.427734375, 3.960693359375, 4.49365234375, 5.026611328125, 5.5595703125, 6.092529296875, 6.62548828125, 7.158447265625, 7.69140625, 8.224365234375, 8.75732421875, 9.290283203125, 9.8232421875, 10.356201171875, 10.88916015625, 11.422119140625, 11.955078125, 12.488037109375, 13.02099609375, 13.553955078125, 14.0869140625, 14.619873046875, 15.15283203125, 15.685791015625, 16.21875]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 6.0, 11.0, 14.0, 18.0, 30.0, 41.0, 62.0, 115.0, 124.0, 197.0, 306.0, 438.0, 763.0, 1102.0, 1712.0, 2750.0, 4217.0, 6936.0, 11561.0, 19547.0, 32750.0, 55292.0, 94128.0, 163121.0, 242546.0, 169810.0, 98035.0, 57296.0, 33903.0, 20146.0, 11893.0, 7337.0, 4472.0, 2816.0, 1733.0, 1166.0, 754.0, 473.0, 297.0, 202.0, 148.0, 104.0, 63.0, 37.0, 40.0, 17.0, 10.0, 7.0, 6.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.339599609375, -0.3288307189941406, -0.31806182861328125, -0.3072929382324219, -0.2965240478515625, -0.2857551574707031, -0.27498626708984375, -0.2642173767089844, -0.253448486328125, -0.24267959594726562, -0.23191070556640625, -0.22114181518554688, -0.2103729248046875, -0.19960403442382812, -0.18883514404296875, -0.17806625366210938, -0.16729736328125, -0.15652847290039062, -0.14575958251953125, -0.13499069213867188, -0.1242218017578125, -0.11345291137695312, -0.10268402099609375, -0.09191513061523438, -0.081146240234375, -0.07037734985351562, -0.05960845947265625, -0.048839569091796875, -0.0380706787109375, -0.027301788330078125, -0.01653289794921875, -0.005764007568359375, 0.0050048828125, 0.015773773193359375, 0.02654266357421875, 0.037311553955078125, 0.0480804443359375, 0.058849334716796875, 0.06961822509765625, 0.08038711547851562, 0.091156005859375, 0.10192489624023438, 0.11269378662109375, 0.12346267700195312, 0.1342315673828125, 0.14500045776367188, 0.15576934814453125, 0.16653823852539062, 0.17730712890625, 0.18807601928710938, 0.19884490966796875, 0.20961380004882812, 0.2203826904296875, 0.23115158081054688, 0.24192047119140625, 0.2526893615722656, 0.263458251953125, 0.2742271423339844, 0.28499603271484375, 0.2957649230957031, 0.3065338134765625, 0.3173027038574219, 0.32807159423828125, 0.3388404846191406, 0.349609375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 0.0, 3.0, 7.0, 10.0, 11.0, 7.0, 8.0, 17.0, 18.0, 19.0, 18.0, 24.0, 24.0, 30.0, 25.0, 41.0, 41.0, 33.0, 45.0, 48.0, 41.0, 38.0, 1072.0, 37.0, 33.0, 30.0, 36.0, 44.0, 35.0, 39.0, 22.0, 25.0, 13.0, 16.0, 19.0, 18.0, 15.0, 16.0, 13.0, 9.0, 6.0, 6.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.859375, -9.533447265625, -9.20751953125, -8.881591796875, -8.5556640625, -8.229736328125, -7.90380859375, -7.577880859375, -7.251953125, -6.926025390625, -6.60009765625, -6.274169921875, -5.9482421875, -5.622314453125, -5.29638671875, -4.970458984375, -4.64453125, -4.318603515625, -3.99267578125, -3.666748046875, -3.3408203125, -3.014892578125, -2.68896484375, -2.363037109375, -2.037109375, -1.711181640625, -1.38525390625, -1.059326171875, -0.7333984375, -0.407470703125, -0.08154296875, 0.244384765625, 0.5703125, 0.896240234375, 1.22216796875, 1.548095703125, 1.8740234375, 2.199951171875, 2.52587890625, 2.851806640625, 3.177734375, 3.503662109375, 3.82958984375, 4.155517578125, 4.4814453125, 4.807373046875, 5.13330078125, 5.459228515625, 5.78515625, 6.111083984375, 6.43701171875, 6.762939453125, 7.0888671875, 7.414794921875, 7.74072265625, 8.066650390625, 8.392578125, 8.718505859375, 9.04443359375, 9.370361328125, 9.6962890625, 10.022216796875, 10.34814453125, 10.674072265625, 11.0]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 6.0, 5.0, 13.0, 13.0, 21.0, 44.0, 60.0, 77.0, 101.0, 141.0, 238.0, 289.0, 391.0, 609.0, 824.0, 1074.0, 1643.0, 2182.0, 3242.0, 4465.0, 6428.0, 9313.0, 13572.0, 20327.0, 30282.0, 46080.0, 70816.0, 112494.0, 178663.0, 1238250.0, 123815.0, 77883.0, 50114.0, 33284.0, 22322.0, 14934.0, 9996.0, 6986.0, 4788.0, 3273.0, 2278.0, 1626.0, 1162.0, 900.0, 608.0, 423.0, 325.0, 219.0, 165.0, 107.0, 98.0, 52.0, 43.0, 22.0, 20.0, 14.0, 11.0, 5.0, 2.0, 5.0, 2.0, 3.0], "bins": [-0.143310546875, -0.138702392578125, -0.13409423828125, -0.129486083984375, -0.1248779296875, -0.120269775390625, -0.11566162109375, -0.111053466796875, -0.1064453125, -0.101837158203125, -0.09722900390625, -0.092620849609375, -0.0880126953125, -0.083404541015625, -0.07879638671875, -0.074188232421875, -0.069580078125, -0.064971923828125, -0.06036376953125, -0.055755615234375, -0.0511474609375, -0.046539306640625, -0.04193115234375, -0.037322998046875, -0.03271484375, -0.028106689453125, -0.02349853515625, -0.018890380859375, -0.0142822265625, -0.009674072265625, -0.00506591796875, -0.000457763671875, 0.004150390625, 0.008758544921875, 0.01336669921875, 0.017974853515625, 0.0225830078125, 0.027191162109375, 0.03179931640625, 0.036407470703125, 0.041015625, 0.045623779296875, 0.05023193359375, 0.054840087890625, 0.0594482421875, 0.064056396484375, 0.06866455078125, 0.073272705078125, 0.077880859375, 0.082489013671875, 0.08709716796875, 0.091705322265625, 0.0963134765625, 0.100921630859375, 0.10552978515625, 0.110137939453125, 0.11474609375, 0.119354248046875, 0.12396240234375, 0.128570556640625, 0.1331787109375, 0.137786865234375, 0.14239501953125, 0.147003173828125, 0.151611328125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 8.0, 9.0, 4.0, 5.0, 11.0, 17.0, 13.0, 14.0, 13.0, 20.0, 27.0, 34.0, 43.0, 49.0, 50.0, 55.0, 60.0, 70.0, 66.0, 52.0, 66.0, 48.0, 51.0, 35.0, 36.0, 27.0, 25.0, 21.0, 18.0, 6.0, 12.0, 7.0, 7.0, 4.0, 4.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0005297660827636719, -0.0005147233605384827, -0.0004996806383132935, -0.00048463791608810425, -0.00046959519386291504, -0.00045455247163772583, -0.0004395097494125366, -0.0004244670271873474, -0.0004094243049621582, -0.000394381582736969, -0.0003793388605117798, -0.0003642961382865906, -0.00034925341606140137, -0.00033421069383621216, -0.00031916797161102295, -0.00030412524938583374, -0.00028908252716064453, -0.0002740398049354553, -0.0002589970827102661, -0.0002439543604850769, -0.0002289116382598877, -0.00021386891603469849, -0.00019882619380950928, -0.00018378347158432007, -0.00016874074935913086, -0.00015369802713394165, -0.00013865530490875244, -0.00012361258268356323, -0.00010856986045837402, -9.352713823318481e-05, -7.84844160079956e-05, -6.34416937828064e-05, -4.839897155761719e-05, -3.335624933242798e-05, -1.831352710723877e-05, -3.2708048820495605e-06, 1.1771917343139648e-05, 2.6814639568328857e-05, 4.1857361793518066e-05, 5.6900084018707275e-05, 7.194280624389648e-05, 8.69855284690857e-05, 0.0001020282506942749, 0.00011707097291946411, 0.00013211369514465332, 0.00014715641736984253, 0.00016219913959503174, 0.00017724186182022095, 0.00019228458404541016, 0.00020732730627059937, 0.00022237002849578857, 0.00023741275072097778, 0.000252455472946167, 0.0002674981951713562, 0.0002825409173965454, 0.0002975836396217346, 0.00031262636184692383, 0.00032766908407211304, 0.00034271180629730225, 0.00035775452852249146, 0.00037279725074768066, 0.0003878399729728699, 0.0004028826951980591, 0.0004179254174232483, 0.0004329681396484375]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 6.0, 3.0, 3.0, 7.0, 9.0, 13.0, 9.0, 21.0, 27.0, 28.0, 34.0, 61.0, 65.0, 125.0, 209.0, 420.0, 1800.0, 981799.0, 62103.0, 870.0, 349.0, 175.0, 100.0, 77.0, 51.0, 45.0, 26.0, 19.0, 14.0, 16.0, 19.0, 10.0, 8.0, 5.0, 9.0, 7.0, 2.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0097198486328125, -0.00938260555267334, -0.00904536247253418, -0.00870811939239502, -0.00837087631225586, -0.0080336332321167, -0.007696390151977539, -0.007359147071838379, -0.007021903991699219, -0.006684660911560059, -0.0063474178314208984, -0.006010174751281738, -0.005672931671142578, -0.005335688591003418, -0.004998445510864258, -0.004661202430725098, -0.0043239593505859375, -0.003986716270446777, -0.003649473190307617, -0.003312230110168457, -0.002974987030029297, -0.0026377439498901367, -0.0023005008697509766, -0.0019632577896118164, -0.0016260147094726562, -0.001288771629333496, -0.0009515285491943359, -0.0006142854690551758, -0.0002770423889160156, 6.020069122314453e-05, 0.0003974437713623047, 0.0007346868515014648, 0.001071929931640625, 0.0014091730117797852, 0.0017464160919189453, 0.0020836591720581055, 0.0024209022521972656, 0.0027581453323364258, 0.003095388412475586, 0.003432631492614746, 0.0037698745727539062, 0.004107117652893066, 0.0044443607330322266, 0.004781603813171387, 0.005118846893310547, 0.005456089973449707, 0.005793333053588867, 0.006130576133728027, 0.0064678192138671875, 0.006805062294006348, 0.007142305374145508, 0.007479548454284668, 0.007816791534423828, 0.008154034614562988, 0.008491277694702148, 0.008828520774841309, 0.009165763854980469, 0.009503006935119629, 0.009840250015258789, 0.01017749309539795, 0.01051473617553711, 0.01085197925567627, 0.01118922233581543, 0.01152646541595459, 0.01186370849609375]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 8.0, 912.0, 88.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0028254054486751556, -0.0027009393088519573, -0.0025764729361981153, -0.002452006796374917, -0.0023275406565517187, -0.0022030742838978767, -0.0020786081440746784, -0.00195414200425148, -0.00182967574801296, -0.0017052094917744398, -0.0015807433519512415, -0.0014562770957127213, -0.0013318108394742012, -0.0012073446996510029, -0.0010828784434124827, -0.0009584122453816235, -0.0008339460473507643, -0.000709479849319905, -0.0005850136512890458, -0.00046054739505052567, -0.00033608119701966643, -0.0002116149989888072, -8.714874275028706e-05, 3.7317455280572176e-05, 0.0001617836533114314, 0.00028624985134229064, 0.00041071607847698033, 0.00053518230561167, 0.0006596485036425292, 0.0007841147016733885, 0.0009085809579119086, 0.0010330472141504288, 0.001157513353973627, 0.0012819796102121472, 0.0014064457500353456, 0.0015309120062738657, 0.001655378146097064, 0.0017798444023355842, 0.0019043106585741043, 0.0020287767983973026, 0.002153242938220501, 0.0022777090780436993, 0.0024021754506975412, 0.0025266415905207396, 0.002651107730343938, 0.00277557410299778, 0.002900040242820978, 0.0030245063826441765, 0.0031489727552980185, 0.0032734388951212168, 0.0033979052677750587, 0.003522371407598257, 0.0036468375474214554, 0.0037713036872446537, 0.0038957700598984957, 0.004020236432552338, 0.004144702572375536, 0.004269168712198734, 0.004393634852021933, 0.004518100991845131, 0.0046425675973296165, 0.004767033737152815, 0.004891499876976013, 0.0050159660167992115, 0.00514043215662241]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 8.0, 25.0, 27.0, 47.0, 45.0, 91.0, 110.0, 95.0, 119.0, 111.0, 108.0, 58.0, 72.0, 36.0, 25.0, 16.0, 9.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000614464282989502, -0.0005881385877728462, -0.0005618128925561905, -0.0005354871973395348, -0.000509161502122879, -0.0004828358069062233, -0.00045651011168956757, -0.00043018441647291183, -0.0004038587212562561, -0.00037753302603960037, -0.00035120733082294464, -0.0003248816356062889, -0.0002985559403896332, -0.00027223024517297745, -0.0002459045499563217, -0.00021957885473966599, -0.00019325315952301025, -0.00016692746430635452, -0.0001406017690896988, -0.00011427607387304306, -8.795037865638733e-05, -6.16246834397316e-05, -3.529898822307587e-05, -8.973293006420135e-06, 1.7352402210235596e-05, 4.367809742689133e-05, 7.000379264354706e-05, 9.632948786020279e-05, 0.00012265518307685852, 0.00014898087829351425, 0.00017530657351016998, 0.00020163226872682571, 0.00022795796394348145, 0.0002542836591601372, 0.0002806093543767929, 0.00030693504959344864, 0.00033326074481010437, 0.0003595864400267601, 0.00038591213524341583, 0.00041223783046007156, 0.0004385635256767273, 0.000464889220893383, 0.0004912149161100388, 0.0005175406113266945, 0.0005438663065433502, 0.000570192001760006, 0.0005965176969766617, 0.0006228433921933174, 0.0006491690874099731, 0.0006754947826266289, 0.0007018204778432846, 0.0007281461730599403, 0.0007544718682765961, 0.0007807975634932518, 0.0008071232587099075, 0.0008334489539265633, 0.000859774649143219, 0.0008861003443598747, 0.0009124260395765305, 0.0009387517347931862, 0.0009650774300098419, 0.0009914031252264977, 0.0010177288204431534, 0.0010440545156598091, 0.0010703802108764648]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 8.0, 3.0, 5.0, 10.0, 9.0, 21.0, 19.0, 22.0, 25.0, 39.0, 27.0, 38.0, 41.0, 33.0, 45.0, 50.0, 38.0, 45.0, 46.0, 31.0, 49.0, 44.0, 39.0, 42.0, 44.0, 38.0, 32.0, 18.0, 27.0, 24.0, 24.0, 21.0, 13.0, 6.0, 8.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.890625, -17.357666015625, -16.82470703125, -16.291748046875, -15.7587890625, -15.225830078125, -14.69287109375, -14.159912109375, -13.626953125, -13.093994140625, -12.56103515625, -12.028076171875, -11.4951171875, -10.962158203125, -10.42919921875, -9.896240234375, -9.36328125, -8.830322265625, -8.29736328125, -7.764404296875, -7.2314453125, -6.698486328125, -6.16552734375, -5.632568359375, -5.099609375, -4.566650390625, -4.03369140625, -3.500732421875, -2.9677734375, -2.434814453125, -1.90185546875, -1.368896484375, -0.8359375, -0.302978515625, 0.22998046875, 0.762939453125, 1.2958984375, 1.828857421875, 2.36181640625, 2.894775390625, 3.427734375, 3.960693359375, 4.49365234375, 5.026611328125, 5.5595703125, 6.092529296875, 6.62548828125, 7.158447265625, 7.69140625, 8.224365234375, 8.75732421875, 9.290283203125, 9.8232421875, 10.356201171875, 10.88916015625, 11.422119140625, 11.955078125, 12.488037109375, 13.02099609375, 13.553955078125, 14.0869140625, 14.619873046875, 15.15283203125, 15.685791015625, 16.21875]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 6.0, 7.0, 10.0, 26.0, 26.0, 39.0, 60.0, 87.0, 112.0, 183.0, 286.0, 442.0, 713.0, 1110.0, 1725.0, 2808.0, 4499.0, 7322.0, 12758.0, 22015.0, 39626.0, 77505.0, 212852.0, 411952.0, 123761.0, 55892.0, 30201.0, 16921.0, 9912.0, 5858.0, 3646.0, 2276.0, 1395.0, 858.0, 539.0, 381.0, 256.0, 147.0, 110.0, 87.0, 44.0, 29.0, 26.0, 12.0, 16.0, 7.0, 4.0, 1.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.6875, -18.049072265625, -17.41064453125, -16.772216796875, -16.1337890625, -15.495361328125, -14.85693359375, -14.218505859375, -13.580078125, -12.941650390625, -12.30322265625, -11.664794921875, -11.0263671875, -10.387939453125, -9.74951171875, -9.111083984375, -8.47265625, -7.834228515625, -7.19580078125, -6.557373046875, -5.9189453125, -5.280517578125, -4.64208984375, -4.003662109375, -3.365234375, -2.726806640625, -2.08837890625, -1.449951171875, -0.8115234375, -0.173095703125, 0.46533203125, 1.103759765625, 1.7421875, 2.380615234375, 3.01904296875, 3.657470703125, 4.2958984375, 4.934326171875, 5.57275390625, 6.211181640625, 6.849609375, 7.488037109375, 8.12646484375, 8.764892578125, 9.4033203125, 10.041748046875, 10.68017578125, 11.318603515625, 11.95703125, 12.595458984375, 13.23388671875, 13.872314453125, 14.5107421875, 15.149169921875, 15.78759765625, 16.426025390625, 17.064453125, 17.702880859375, 18.34130859375, 18.979736328125, 19.6181640625, 20.256591796875, 20.89501953125, 21.533447265625, 22.171875]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 7.0, 3.0, 14.0, 4.0, 9.0, 6.0, 8.0, 11.0, 11.0, 17.0, 20.0, 23.0, 29.0, 28.0, 38.0, 25.0, 30.0, 44.0, 50.0, 90.0, 110.0, 225.0, 1526.0, 184.0, 95.0, 70.0, 41.0, 42.0, 42.0, 36.0, 33.0, 24.0, 23.0, 16.0, 23.0, 22.0, 22.0, 11.0, 8.0, 10.0, 8.0, 9.0, 0.0, 4.0, 2.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.53125, -37.34033203125, -36.1494140625, -34.95849609375, -33.767578125, -32.57666015625, -31.3857421875, -30.19482421875, -29.00390625, -27.81298828125, -26.6220703125, -25.43115234375, -24.240234375, -23.04931640625, -21.8583984375, -20.66748046875, -19.4765625, -18.28564453125, -17.0947265625, -15.90380859375, -14.712890625, -13.52197265625, -12.3310546875, -11.14013671875, -9.94921875, -8.75830078125, -7.5673828125, -6.37646484375, -5.185546875, -3.99462890625, -2.8037109375, -1.61279296875, -0.421875, 0.76904296875, 1.9599609375, 3.15087890625, 4.341796875, 5.53271484375, 6.7236328125, 7.91455078125, 9.10546875, 10.29638671875, 11.4873046875, 12.67822265625, 13.869140625, 15.06005859375, 16.2509765625, 17.44189453125, 18.6328125, 19.82373046875, 21.0146484375, 22.20556640625, 23.396484375, 24.58740234375, 25.7783203125, 26.96923828125, 28.16015625, 29.35107421875, 30.5419921875, 31.73291015625, 32.923828125, 34.11474609375, 35.3056640625, 36.49658203125, 37.6875]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 9.0, 6.0, 7.0, 7.0, 13.0, 14.0, 21.0, 35.0, 47.0, 50.0, 92.0, 114.0, 199.0, 436.0, 932.0, 2114.0, 5822.0, 17492.0, 64994.0, 479842.0, 2391760.0, 135233.0, 30905.0, 9548.0, 3353.0, 1312.0, 604.0, 268.0, 157.0, 100.0, 57.0, 40.0, 34.0, 21.0, 22.0, 7.0, 15.0, 11.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-46.0625, -44.716796875, -43.37109375, -42.025390625, -40.6796875, -39.333984375, -37.98828125, -36.642578125, -35.296875, -33.951171875, -32.60546875, -31.259765625, -29.9140625, -28.568359375, -27.22265625, -25.876953125, -24.53125, -23.185546875, -21.83984375, -20.494140625, -19.1484375, -17.802734375, -16.45703125, -15.111328125, -13.765625, -12.419921875, -11.07421875, -9.728515625, -8.3828125, -7.037109375, -5.69140625, -4.345703125, -3.0, -1.654296875, -0.30859375, 1.037109375, 2.3828125, 3.728515625, 5.07421875, 6.419921875, 7.765625, 9.111328125, 10.45703125, 11.802734375, 13.1484375, 14.494140625, 15.83984375, 17.185546875, 18.53125, 19.876953125, 21.22265625, 22.568359375, 23.9140625, 25.259765625, 26.60546875, 27.951171875, 29.296875, 30.642578125, 31.98828125, 33.333984375, 34.6796875, 36.025390625, 37.37109375, 38.716796875, 40.0625]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 10.0, 37.0, 117.0, 233.0, 297.0, 210.0, 69.0, 29.0, 7.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.21734619140625, -40.668174743652344, -35.11900329589844, -29.569833755493164, -24.020662307739258, -18.47149085998535, -12.922321319580078, -7.373149871826172, -1.8239784240722656, 3.7251925468444824, 9.27436351776123, 14.82353401184082, 20.372705459594727, 25.921876907348633, 31.471046447753906, 37.02021789550781, 42.56938934326172, 48.118560791015625, 53.66773223876953, 59.21690368652344, 64.76607513427734, 70.31524658203125, 75.86441040039062, 81.41358947753906, 86.96275329589844, 92.51192474365234, 98.06109619140625, 103.61026763916016, 109.15943908691406, 114.70861053466797, 120.25778198242188, 125.80694580078125, 131.3561248779297, 136.90528869628906, 142.4544677734375, 148.00363159179688, 153.5528106689453, 159.1019744873047, 164.65115356445312, 170.2003173828125, 175.74949645996094, 181.2986602783203, 186.84783935546875, 192.39700317382812, 197.94618225097656, 203.49534606933594, 209.04452514648438, 214.59368896484375, 220.14285278320312, 225.6920166015625, 231.24119567871094, 236.7903594970703, 242.33953857421875, 247.88870239257812, 253.43788146972656, 258.987060546875, 264.5362243652344, 270.08538818359375, 275.6345520019531, 281.1837463378906, 286.73291015625, 292.2820739746094, 297.83123779296875, 303.38043212890625, 308.9295959472656]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 8.0, 9.0, 4.0, 13.0, 11.0, 13.0, 14.0, 20.0, 19.0, 21.0, 20.0, 26.0, 27.0, 36.0, 26.0, 28.0, 41.0, 42.0, 39.0, 40.0, 39.0, 40.0, 38.0, 40.0, 44.0, 39.0, 37.0, 39.0, 34.0, 27.0, 25.0, 19.0, 13.0, 23.0, 12.0, 11.0, 10.0, 9.0, 13.0, 6.0, 7.0, 6.0, 4.0, 5.0, 6.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-83.2530746459961, -80.60598754882812, -77.95890045166016, -75.31180572509766, -72.66471862792969, -70.01763153076172, -67.37054443359375, -64.72345733642578, -62.07636642456055, -59.42927932739258, -56.782188415527344, -54.135101318359375, -51.488014221191406, -48.84092330932617, -46.1938362121582, -43.54674530029297, -40.899658203125, -38.25257110595703, -35.6054801940918, -32.95839309692383, -30.311304092407227, -27.664215087890625, -25.017127990722656, -22.370038986206055, -19.722949981689453, -17.07586097717285, -14.428772926330566, -11.781684875488281, -9.13459587097168, -6.487506866455078, -3.840418815612793, -1.1933307647705078, 1.4537506103515625, 4.100839138031006, 6.747927665710449, 9.395015716552734, 12.042104721069336, 14.689193725585938, 17.336280822753906, 19.983369827270508, 22.63045883178711, 25.27754783630371, 27.924636840820312, 30.57172393798828, 33.21881103515625, 35.865901947021484, 38.51298904418945, 41.16007995605469, 43.807167053222656, 46.454254150390625, 49.10134506225586, 51.74843215942383, 54.39552307128906, 57.04261016845703, 59.689697265625, 62.33678436279297, 64.98387145996094, 67.6309585571289, 70.27804565429688, 72.92514038085938, 75.57222747802734, 78.21931457519531, 80.86640167236328, 83.51348876953125, 86.16058349609375]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 7.0, 3.0, 7.0, 7.0, 9.0, 17.0, 15.0, 19.0, 23.0, 26.0, 38.0, 35.0, 34.0, 42.0, 48.0, 28.0, 48.0, 31.0, 46.0, 46.0, 42.0, 38.0, 41.0, 40.0, 34.0, 41.0, 25.0, 34.0, 37.0, 21.0, 22.0, 18.0, 18.0, 18.0, 12.0, 7.0, 7.0, 3.0, 2.0, 4.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-17.46875, -16.945068359375, -16.42138671875, -15.897705078125, -15.3740234375, -14.850341796875, -14.32666015625, -13.802978515625, -13.279296875, -12.755615234375, -12.23193359375, -11.708251953125, -11.1845703125, -10.660888671875, -10.13720703125, -9.613525390625, -9.08984375, -8.566162109375, -8.04248046875, -7.518798828125, -6.9951171875, -6.471435546875, -5.94775390625, -5.424072265625, -4.900390625, -4.376708984375, -3.85302734375, -3.329345703125, -2.8056640625, -2.281982421875, -1.75830078125, -1.234619140625, -0.7109375, -0.187255859375, 0.33642578125, 0.860107421875, 1.3837890625, 1.907470703125, 2.43115234375, 2.954833984375, 3.478515625, 4.002197265625, 4.52587890625, 5.049560546875, 5.5732421875, 6.096923828125, 6.62060546875, 7.144287109375, 7.66796875, 8.191650390625, 8.71533203125, 9.239013671875, 9.7626953125, 10.286376953125, 10.81005859375, 11.333740234375, 11.857421875, 12.381103515625, 12.90478515625, 13.428466796875, 13.9521484375, 14.475830078125, 14.99951171875, 15.523193359375, 16.046875]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 4.0, 7.0, 3.0, 6.0, 16.0, 14.0, 15.0, 31.0, 34.0, 52.0, 85.0, 94.0, 152.0, 227.0, 280.0, 475.0, 666.0, 974.0, 1382.0, 2244.0, 3529.0, 5793.0, 9683.0, 18152.0, 41369.0, 158389.0, 1085371.0, 2332195.0, 399417.0, 73431.0, 26566.0, 12915.0, 7614.0, 4514.0, 2865.0, 1859.0, 1236.0, 837.0, 584.0, 374.0, 261.0, 204.0, 98.0, 85.0, 59.0, 33.0, 25.0, 16.0, 21.0, 6.0, 11.0, 5.0, 9.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.75, -22.96484375, -22.1796875, -21.39453125, -20.609375, -19.82421875, -19.0390625, -18.25390625, -17.46875, -16.68359375, -15.8984375, -15.11328125, -14.328125, -13.54296875, -12.7578125, -11.97265625, -11.1875, -10.40234375, -9.6171875, -8.83203125, -8.046875, -7.26171875, -6.4765625, -5.69140625, -4.90625, -4.12109375, -3.3359375, -2.55078125, -1.765625, -0.98046875, -0.1953125, 0.58984375, 1.375, 2.16015625, 2.9453125, 3.73046875, 4.515625, 5.30078125, 6.0859375, 6.87109375, 7.65625, 8.44140625, 9.2265625, 10.01171875, 10.796875, 11.58203125, 12.3671875, 13.15234375, 13.9375, 14.72265625, 15.5078125, 16.29296875, 17.078125, 17.86328125, 18.6484375, 19.43359375, 20.21875, 21.00390625, 21.7890625, 22.57421875, 23.359375, 24.14453125, 24.9296875, 25.71484375, 26.5]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 7.0, 6.0, 5.0, 11.0, 12.0, 11.0, 18.0, 16.0, 19.0, 29.0, 37.0, 45.0, 52.0, 71.0, 93.0, 158.0, 238.0, 476.0, 724.0, 734.0, 485.0, 273.0, 161.0, 97.0, 58.0, 43.0, 41.0, 29.0, 31.0, 14.0, 16.0, 8.0, 13.0, 6.0, 6.0, 5.0, 3.0, 6.0, 4.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.59375, -26.8056640625, -26.017578125, -25.2294921875, -24.44140625, -23.6533203125, -22.865234375, -22.0771484375, -21.2890625, -20.5009765625, -19.712890625, -18.9248046875, -18.13671875, -17.3486328125, -16.560546875, -15.7724609375, -14.984375, -14.1962890625, -13.408203125, -12.6201171875, -11.83203125, -11.0439453125, -10.255859375, -9.4677734375, -8.6796875, -7.8916015625, -7.103515625, -6.3154296875, -5.52734375, -4.7392578125, -3.951171875, -3.1630859375, -2.375, -1.5869140625, -0.798828125, -0.0107421875, 0.77734375, 1.5654296875, 2.353515625, 3.1416015625, 3.9296875, 4.7177734375, 5.505859375, 6.2939453125, 7.08203125, 7.8701171875, 8.658203125, 9.4462890625, 10.234375, 11.0224609375, 11.810546875, 12.5986328125, 13.38671875, 14.1748046875, 14.962890625, 15.7509765625, 16.5390625, 17.3271484375, 18.115234375, 18.9033203125, 19.69140625, 20.4794921875, 21.267578125, 22.0556640625, 22.84375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 6.0, 1.0, 8.0, 12.0, 20.0, 19.0, 35.0, 54.0, 79.0, 98.0, 193.0, 336.0, 635.0, 1264.0, 2925.0, 6538.0, 16146.0, 47167.0, 193817.0, 2996149.0, 786148.0, 95417.0, 28165.0, 10486.0, 4446.0, 1969.0, 918.0, 500.0, 275.0, 141.0, 99.0, 65.0, 35.0, 35.0, 20.0, 13.0, 14.0, 9.0, 5.0, 7.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-48.125, -46.7412109375, -45.357421875, -43.9736328125, -42.58984375, -41.2060546875, -39.822265625, -38.4384765625, -37.0546875, -35.6708984375, -34.287109375, -32.9033203125, -31.51953125, -30.1357421875, -28.751953125, -27.3681640625, -25.984375, -24.6005859375, -23.216796875, -21.8330078125, -20.44921875, -19.0654296875, -17.681640625, -16.2978515625, -14.9140625, -13.5302734375, -12.146484375, -10.7626953125, -9.37890625, -7.9951171875, -6.611328125, -5.2275390625, -3.84375, -2.4599609375, -1.076171875, 0.3076171875, 1.69140625, 3.0751953125, 4.458984375, 5.8427734375, 7.2265625, 8.6103515625, 9.994140625, 11.3779296875, 12.76171875, 14.1455078125, 15.529296875, 16.9130859375, 18.296875, 19.6806640625, 21.064453125, 22.4482421875, 23.83203125, 25.2158203125, 26.599609375, 27.9833984375, 29.3671875, 30.7509765625, 32.134765625, 33.5185546875, 34.90234375, 36.2861328125, 37.669921875, 39.0537109375, 40.4375]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 46.0, 220.0, 510.0, 196.0, 34.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-211.16114807128906, -196.59690856933594, -182.0326690673828, -167.4684295654297, -152.90419006347656, -138.33995056152344, -123.77571105957031, -109.21147155761719, -94.64723205566406, -80.08299255371094, -65.51875305175781, -50.95451354980469, -36.39027404785156, -21.826034545898438, -7.2617950439453125, 7.3024444580078125, 21.866683959960938, 36.43092346191406, 50.99516296386719, 65.55940246582031, 80.12364196777344, 94.68788146972656, 109.25212097167969, 123.81636047363281, 138.38059997558594, 152.94483947753906, 167.5090789794922, 182.0733184814453, 196.63755798339844, 211.20179748535156, 225.7660369873047, 240.3302764892578, 254.89453125, 269.4587707519531, 284.02301025390625, 298.5872497558594, 313.1514892578125, 327.7157287597656, 342.27996826171875, 356.8442077636719, 371.408447265625, 385.9726867675781, 400.53692626953125, 415.1011657714844, 429.6654052734375, 444.2296447753906, 458.79388427734375, 473.3581237792969, 487.92236328125, 502.4866027832031, 517.0508422851562, 531.6151123046875, 546.1793212890625, 560.7435302734375, 575.3078002929688, 589.8720703125, 604.436279296875, 619.00048828125, 633.5647583007812, 648.1290283203125, 662.6932373046875, 677.2574462890625, 691.8217163085938, 706.385986328125, 720.9501953125]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 5.0, 4.0, 3.0, 6.0, 10.0, 9.0, 9.0, 19.0, 25.0, 16.0, 17.0, 22.0, 32.0, 30.0, 38.0, 32.0, 38.0, 38.0, 36.0, 33.0, 51.0, 45.0, 54.0, 55.0, 34.0, 32.0, 28.0, 26.0, 30.0, 29.0, 37.0, 29.0, 25.0, 19.0, 17.0, 15.0, 4.0, 6.0, 12.0, 8.0, 4.0, 5.0, 6.0, 1.0, 3.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-72.73143005371094, -70.1810302734375, -67.6306381225586, -65.08023834228516, -62.52984619140625, -59.97944641113281, -57.42905044555664, -54.87865447998047, -52.3282585144043, -49.777862548828125, -47.22746658325195, -44.67707061767578, -42.126670837402344, -39.57627868652344, -37.02587890625, -34.47548294067383, -31.925086975097656, -29.374691009521484, -26.824295043945312, -24.273897171020508, -21.723501205444336, -19.173105239868164, -16.62270736694336, -14.072311401367188, -11.521915435791016, -8.971519470214844, -6.4211225509643555, -3.8707261085510254, -1.3203296661376953, 1.2300662994384766, 3.780463218688965, 6.330860137939453, 8.881248474121094, 11.431644439697266, 13.982041358947754, 16.532438278198242, 19.082834243774414, 21.633230209350586, 24.18362808227539, 26.734024047851562, 29.284420013427734, 31.834815979003906, 34.38521194458008, 36.93560791015625, 39.48600769042969, 42.036399841308594, 44.58679962158203, 47.1371955871582, 49.687591552734375, 52.23798751831055, 54.78838348388672, 57.33877944946289, 59.88917541503906, 62.4395751953125, 64.9899673461914, 67.54036712646484, 70.09075927734375, 72.64115905761719, 75.1915512084961, 77.74195098876953, 80.29234313964844, 82.84274291992188, 85.39313507080078, 87.94353485107422, 90.49393463134766]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 3.0, 5.0, 8.0, 9.0, 12.0, 17.0, 25.0, 16.0, 18.0, 25.0, 32.0, 33.0, 37.0, 30.0, 37.0, 31.0, 41.0, 44.0, 45.0, 48.0, 38.0, 33.0, 48.0, 44.0, 48.0, 37.0, 34.0, 25.0, 31.0, 37.0, 21.0, 19.0, 14.0, 11.0, 10.0, 10.0, 10.0, 3.0, 3.0, 7.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.921875, -16.368896484375, -15.81591796875, -15.262939453125, -14.7099609375, -14.156982421875, -13.60400390625, -13.051025390625, -12.498046875, -11.945068359375, -11.39208984375, -10.839111328125, -10.2861328125, -9.733154296875, -9.18017578125, -8.627197265625, -8.07421875, -7.521240234375, -6.96826171875, -6.415283203125, -5.8623046875, -5.309326171875, -4.75634765625, -4.203369140625, -3.650390625, -3.097412109375, -2.54443359375, -1.991455078125, -1.4384765625, -0.885498046875, -0.33251953125, 0.220458984375, 0.7734375, 1.326416015625, 1.87939453125, 2.432373046875, 2.9853515625, 3.538330078125, 4.09130859375, 4.644287109375, 5.197265625, 5.750244140625, 6.30322265625, 6.856201171875, 7.4091796875, 7.962158203125, 8.51513671875, 9.068115234375, 9.62109375, 10.174072265625, 10.72705078125, 11.280029296875, 11.8330078125, 12.385986328125, 12.93896484375, 13.491943359375, 14.044921875, 14.597900390625, 15.15087890625, 15.703857421875, 16.2568359375, 16.809814453125, 17.36279296875, 17.915771484375, 18.46875]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 4.0, 7.0, 21.0, 29.0, 39.0, 74.0, 100.0, 149.0, 211.0, 340.0, 492.0, 771.0, 1154.0, 1817.0, 2835.0, 4372.0, 6932.0, 11198.0, 17951.0, 29288.0, 47068.0, 76274.0, 123972.0, 214771.0, 201477.0, 117173.0, 71960.0, 44676.0, 27318.0, 17029.0, 10563.0, 6684.0, 4183.0, 2715.0, 1728.0, 1104.0, 712.0, 503.0, 291.0, 178.0, 154.0, 78.0, 42.0, 33.0, 27.0, 17.0, 9.0, 14.0, 4.0, 4.0, 7.0, 2.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.331787109375, -0.3213996887207031, -0.31101226806640625, -0.3006248474121094, -0.2902374267578125, -0.2798500061035156, -0.26946258544921875, -0.2590751647949219, -0.248687744140625, -0.23830032348632812, -0.22791290283203125, -0.21752548217773438, -0.2071380615234375, -0.19675064086914062, -0.18636322021484375, -0.17597579956054688, -0.16558837890625, -0.15520095825195312, -0.14481353759765625, -0.13442611694335938, -0.1240386962890625, -0.11365127563476562, -0.10326385498046875, -0.09287643432617188, -0.082489013671875, -0.07210159301757812, -0.06171417236328125, -0.051326751708984375, -0.0409393310546875, -0.030551910400390625, -0.02016448974609375, -0.009777069091796875, 0.0006103515625, 0.010997772216796875, 0.02138519287109375, 0.031772613525390625, 0.0421600341796875, 0.052547454833984375, 0.06293487548828125, 0.07332229614257812, 0.083709716796875, 0.09409713745117188, 0.10448455810546875, 0.11487197875976562, 0.1252593994140625, 0.13564682006835938, 0.14603424072265625, 0.15642166137695312, 0.16680908203125, 0.17719650268554688, 0.18758392333984375, 0.19797134399414062, 0.2083587646484375, 0.21874618530273438, 0.22913360595703125, 0.23952102661132812, 0.249908447265625, 0.2602958679199219, 0.27068328857421875, 0.2810707092285156, 0.2914581298828125, 0.3018455505371094, 0.31223297119140625, 0.3226203918457031, 0.3330078125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 4.0, 10.0, 15.0, 10.0, 12.0, 17.0, 12.0, 19.0, 28.0, 24.0, 25.0, 33.0, 31.0, 39.0, 36.0, 40.0, 31.0, 46.0, 40.0, 1081.0, 39.0, 37.0, 45.0, 34.0, 26.0, 44.0, 35.0, 18.0, 32.0, 24.0, 28.0, 19.0, 16.0, 16.0, 10.0, 7.0, 8.0, 8.0, 7.0, 3.0, 6.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.625, -11.2523193359375, -10.879638671875, -10.5069580078125, -10.13427734375, -9.7615966796875, -9.388916015625, -9.0162353515625, -8.6435546875, -8.2708740234375, -7.898193359375, -7.5255126953125, -7.15283203125, -6.7801513671875, -6.407470703125, -6.0347900390625, -5.662109375, -5.2894287109375, -4.916748046875, -4.5440673828125, -4.17138671875, -3.7987060546875, -3.426025390625, -3.0533447265625, -2.6806640625, -2.3079833984375, -1.935302734375, -1.5626220703125, -1.18994140625, -0.8172607421875, -0.444580078125, -0.0718994140625, 0.30078125, 0.6734619140625, 1.046142578125, 1.4188232421875, 1.79150390625, 2.1641845703125, 2.536865234375, 2.9095458984375, 3.2822265625, 3.6549072265625, 4.027587890625, 4.4002685546875, 4.77294921875, 5.1456298828125, 5.518310546875, 5.8909912109375, 6.263671875, 6.6363525390625, 7.009033203125, 7.3817138671875, 7.75439453125, 8.1270751953125, 8.499755859375, 8.8724365234375, 9.2451171875, 9.6177978515625, 9.990478515625, 10.3631591796875, 10.73583984375, 11.1085205078125, 11.481201171875, 11.8538818359375, 12.2265625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 9.0, 10.0, 20.0, 27.0, 34.0, 35.0, 77.0, 93.0, 161.0, 244.0, 315.0, 476.0, 749.0, 1088.0, 1545.0, 2277.0, 3284.0, 4856.0, 7444.0, 11406.0, 17423.0, 27365.0, 44119.0, 71367.0, 119476.0, 257228.0, 1206894.0, 121969.0, 71938.0, 44924.0, 28021.0, 17832.0, 11426.0, 7538.0, 4988.0, 3250.0, 2252.0, 1566.0, 1068.0, 752.0, 504.0, 349.0, 246.0, 165.0, 120.0, 72.0, 47.0, 34.0, 20.0, 9.0, 9.0, 7.0, 4.0, 4.0, 2.0, 2.0, 3.0], "bins": [-0.192138671875, -0.18631935119628906, -0.18050003051757812, -0.1746807098388672, -0.16886138916015625, -0.1630420684814453, -0.15722274780273438, -0.15140342712402344, -0.1455841064453125, -0.13976478576660156, -0.13394546508789062, -0.1281261444091797, -0.12230682373046875, -0.11648750305175781, -0.11066818237304688, -0.10484886169433594, -0.099029541015625, -0.09321022033691406, -0.08739089965820312, -0.08157157897949219, -0.07575225830078125, -0.06993293762207031, -0.06411361694335938, -0.05829429626464844, -0.0524749755859375, -0.04665565490722656, -0.040836334228515625, -0.03501701354980469, -0.02919769287109375, -0.023378372192382812, -0.017559051513671875, -0.011739730834960938, -0.00592041015625, -0.0001010894775390625, 0.005718231201171875, 0.011537551879882812, 0.01735687255859375, 0.023176193237304688, 0.028995513916015625, 0.03481483459472656, 0.0406341552734375, 0.04645347595214844, 0.052272796630859375, 0.05809211730957031, 0.06391143798828125, 0.06973075866699219, 0.07555007934570312, 0.08136940002441406, 0.087188720703125, 0.09300804138183594, 0.09882736206054688, 0.10464668273925781, 0.11046600341796875, 0.11628532409667969, 0.12210464477539062, 0.12792396545410156, 0.1337432861328125, 0.13956260681152344, 0.14538192749023438, 0.1512012481689453, 0.15702056884765625, 0.1628398895263672, 0.16865921020507812, 0.17447853088378906, 0.1802978515625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 4.0, 3.0, 1.0, 3.0, 9.0, 10.0, 7.0, 3.0, 4.0, 11.0, 18.0, 16.0, 22.0, 23.0, 29.0, 20.0, 28.0, 40.0, 43.0, 39.0, 66.0, 102.0, 111.0, 67.0, 55.0, 35.0, 42.0, 31.0, 20.0, 29.0, 16.0, 14.0, 13.0, 11.0, 12.0, 9.0, 9.0, 6.0, 8.0, 6.0, 4.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004000663757324219, -0.0003871992230415344, -0.00037433207035064697, -0.0003614649176597595, -0.00034859776496887207, -0.0003357306122779846, -0.00032286345958709717, -0.0003099963068962097, -0.00029712915420532227, -0.0002842620015144348, -0.00027139484882354736, -0.0002585276961326599, -0.00024566054344177246, -0.000232793390750885, -0.00021992623805999756, -0.0002070590853691101, -0.00019419193267822266, -0.0001813247799873352, -0.00016845762729644775, -0.0001555904746055603, -0.00014272332191467285, -0.0001298561692237854, -0.00011698901653289795, -0.0001041218638420105, -9.125471115112305e-05, -7.83875584602356e-05, -6.552040576934814e-05, -5.265325307846069e-05, -3.978610038757324e-05, -2.691894769668579e-05, -1.405179500579834e-05, -1.1846423149108887e-06, 1.1682510375976562e-05, 2.4549663066864014e-05, 3.7416815757751465e-05, 5.0283968448638916e-05, 6.315112113952637e-05, 7.601827383041382e-05, 8.888542652130127e-05, 0.00010175257921218872, 0.00011461973190307617, 0.00012748688459396362, 0.00014035403728485107, 0.00015322118997573853, 0.00016608834266662598, 0.00017895549535751343, 0.00019182264804840088, 0.00020468980073928833, 0.00021755695343017578, 0.00023042410612106323, 0.00024329125881195068, 0.00025615841150283813, 0.0002690255641937256, 0.00028189271688461304, 0.0002947598695755005, 0.00030762702226638794, 0.0003204941749572754, 0.00033336132764816284, 0.0003462284803390503, 0.00035909563302993774, 0.0003719627857208252, 0.00038482993841171265, 0.0003976970911026001, 0.00041056424379348755, 0.000423431396484375]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 6.0, 6.0, 8.0, 10.0, 12.0, 7.0, 14.0, 20.0, 14.0, 22.0, 37.0, 43.0, 59.0, 81.0, 133.0, 232.0, 540.0, 3175.0, 1023569.0, 18884.0, 799.0, 293.0, 172.0, 100.0, 69.0, 36.0, 43.0, 35.0, 25.0, 22.0, 19.0, 18.0, 2.0, 7.0, 5.0, 12.0, 6.0, 7.0, 0.0, 3.0, 4.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00942230224609375, -0.00913381576538086, -0.008845329284667969, -0.008556842803955078, -0.008268356323242188, -0.007979869842529297, -0.007691383361816406, -0.007402896881103516, -0.007114410400390625, -0.006825923919677734, -0.006537437438964844, -0.006248950958251953, -0.0059604644775390625, -0.005671977996826172, -0.005383491516113281, -0.005095005035400391, -0.0048065185546875, -0.004518032073974609, -0.004229545593261719, -0.003941059112548828, -0.0036525726318359375, -0.003364086151123047, -0.0030755996704101562, -0.0027871131896972656, -0.002498626708984375, -0.0022101402282714844, -0.0019216537475585938, -0.0016331672668457031, -0.0013446807861328125, -0.0010561943054199219, -0.0007677078247070312, -0.0004792213439941406, -0.00019073486328125, 9.775161743164062e-05, 0.00038623809814453125, 0.0006747245788574219, 0.0009632110595703125, 0.0012516975402832031, 0.0015401840209960938, 0.0018286705017089844, 0.002117156982421875, 0.0024056434631347656, 0.0026941299438476562, 0.002982616424560547, 0.0032711029052734375, 0.003559589385986328, 0.0038480758666992188, 0.004136562347412109, 0.004425048828125, 0.004713535308837891, 0.005002021789550781, 0.005290508270263672, 0.0055789947509765625, 0.005867481231689453, 0.006155967712402344, 0.006444454193115234, 0.006732940673828125, 0.007021427154541016, 0.007309913635253906, 0.007598400115966797, 0.007886886596679688, 0.008175373077392578, 0.008463859558105469, 0.00875234603881836, 0.00904083251953125]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 262.0, 748.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0024615549482405186, -0.0023176034446805716, -0.0021736519411206245, -0.0020297004375606775, -0.0018857489340007305, -0.0017417974304407835, -0.0015978459268808365, -0.0014538944233208895, -0.0013099429197609425, -0.0011659914162009954, -0.0010220399126410484, -0.0008780884090811014, -0.0007341369055211544, -0.0005901854019612074, -0.0004462338984012604, -0.00030228239484131336, -0.00015833089128136635, -1.4379387721419334e-05, 0.00012957211583852768, 0.0002735236193984747, 0.0004174751229584217, 0.0005614266265183687, 0.0007053781300783157, 0.0008493296336382627, 0.0009932811371982098, 0.0011372326407581568, 0.0012811841443181038, 0.0014251356478780508, 0.0015690871514379978, 0.0017130386549979448, 0.0018569901585578918, 0.002000941662117839, 0.0021448927000164986, 0.0022888442035764456, 0.0024327957071363926, 0.0025767472106963396, 0.0027206987142562866, 0.0028646502178162336, 0.0030086017213761806, 0.0031525532249361277, 0.0032965047284960747, 0.0034404562320560217, 0.0035844077356159687, 0.0037283592391759157, 0.0038723107427358627, 0.004016262479126453, 0.004160213749855757, 0.00430416502058506, 0.004448116756975651, 0.0045920684933662415, 0.004736019764095545, 0.004879971034824848, 0.005023922771215439, 0.0051678745076060295, 0.005311825778335333, 0.005455777049064636, 0.005599728785455227, 0.0057436805218458176, 0.005887631792575121, 0.006031583063304424, 0.006175534799695015, 0.006319486536085606, 0.006463437806814909, 0.006607389077544212, 0.006751340813934803]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 10.0, 10.0, 21.0, 30.0, 40.0, 63.0, 69.0, 77.0, 107.0, 106.0, 94.0, 83.0, 85.0, 64.0, 61.0, 29.0, 22.0, 16.0, 11.0, 2.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00043714046478271484, -0.0004170164465904236, -0.0003968924283981323, -0.00037676841020584106, -0.0003566443920135498, -0.00033652037382125854, -0.0003163963556289673, -0.000296272337436676, -0.00027614831924438477, -0.0002560243010520935, -0.00023590028285980225, -0.00021577626466751099, -0.00019565224647521973, -0.00017552822828292847, -0.0001554042100906372, -0.00013528019189834595, -0.00011515617370605469, -9.503215551376343e-05, -7.490813732147217e-05, -5.478411912918091e-05, -3.466010093688965e-05, -1.4536082744598389e-05, 5.587935447692871e-06, 2.571195363998413e-05, 4.583597183227539e-05, 6.595999002456665e-05, 8.608400821685791e-05, 0.00010620802640914917, 0.00012633204460144043, 0.0001464560627937317, 0.00016658008098602295, 0.0001867040991783142, 0.00020682811737060547, 0.00022695213556289673, 0.000247076153755188, 0.00026720017194747925, 0.0002873241901397705, 0.00030744820833206177, 0.00032757222652435303, 0.0003476962447166443, 0.00036782026290893555, 0.0003879442811012268, 0.00040806829929351807, 0.0004281923174858093, 0.0004483163356781006, 0.00046844035387039185, 0.0004885643720626831, 0.0005086883902549744, 0.0005288124084472656, 0.0005489364266395569, 0.0005690604448318481, 0.0005891844630241394, 0.0006093084812164307, 0.0006294324994087219, 0.0006495565176010132, 0.0006696805357933044, 0.0006898045539855957, 0.000709928572177887, 0.0007300525903701782, 0.0007501766085624695, 0.0007703006267547607, 0.000790424644947052, 0.0008105486631393433, 0.0008306726813316345, 0.0008507966995239258]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 3.0, 5.0, 8.0, 9.0, 12.0, 17.0, 25.0, 16.0, 18.0, 25.0, 32.0, 33.0, 37.0, 30.0, 37.0, 31.0, 41.0, 44.0, 45.0, 48.0, 38.0, 33.0, 48.0, 44.0, 48.0, 37.0, 34.0, 25.0, 31.0, 37.0, 21.0, 19.0, 14.0, 11.0, 10.0, 10.0, 10.0, 3.0, 3.0, 7.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.921875, -16.368896484375, -15.81591796875, -15.262939453125, -14.7099609375, -14.156982421875, -13.60400390625, -13.051025390625, -12.498046875, -11.945068359375, -11.39208984375, -10.839111328125, -10.2861328125, -9.733154296875, -9.18017578125, -8.627197265625, -8.07421875, -7.521240234375, -6.96826171875, -6.415283203125, -5.8623046875, -5.309326171875, -4.75634765625, -4.203369140625, -3.650390625, -3.097412109375, -2.54443359375, -1.991455078125, -1.4384765625, -0.885498046875, -0.33251953125, 0.220458984375, 0.7734375, 1.326416015625, 1.87939453125, 2.432373046875, 2.9853515625, 3.538330078125, 4.09130859375, 4.644287109375, 5.197265625, 5.750244140625, 6.30322265625, 6.856201171875, 7.4091796875, 7.962158203125, 8.51513671875, 9.068115234375, 9.62109375, 10.174072265625, 10.72705078125, 11.280029296875, 11.8330078125, 12.385986328125, 12.93896484375, 13.491943359375, 14.044921875, 14.597900390625, 15.15087890625, 15.703857421875, 16.2568359375, 16.809814453125, 17.36279296875, 17.915771484375, 18.46875]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 11.0, 6.0, 13.0, 17.0, 20.0, 36.0, 53.0, 73.0, 110.0, 156.0, 238.0, 395.0, 572.0, 949.0, 1464.0, 2347.0, 3611.0, 5898.0, 9482.0, 16701.0, 31602.0, 72078.0, 239854.0, 445265.0, 118102.0, 45072.0, 22132.0, 12451.0, 7325.0, 4499.0, 2908.0, 1779.0, 1214.0, 682.0, 471.0, 324.0, 188.0, 156.0, 103.0, 64.0, 36.0, 32.0, 18.0, 16.0, 8.0, 7.0, 5.0, 3.0, 4.0, 5.0, 0.0, 1.0, 1.0, 1.0], "bins": [-20.59375, -19.97412109375, -19.3544921875, -18.73486328125, -18.115234375, -17.49560546875, -16.8759765625, -16.25634765625, -15.63671875, -15.01708984375, -14.3974609375, -13.77783203125, -13.158203125, -12.53857421875, -11.9189453125, -11.29931640625, -10.6796875, -10.06005859375, -9.4404296875, -8.82080078125, -8.201171875, -7.58154296875, -6.9619140625, -6.34228515625, -5.72265625, -5.10302734375, -4.4833984375, -3.86376953125, -3.244140625, -2.62451171875, -2.0048828125, -1.38525390625, -0.765625, -0.14599609375, 0.4736328125, 1.09326171875, 1.712890625, 2.33251953125, 2.9521484375, 3.57177734375, 4.19140625, 4.81103515625, 5.4306640625, 6.05029296875, 6.669921875, 7.28955078125, 7.9091796875, 8.52880859375, 9.1484375, 9.76806640625, 10.3876953125, 11.00732421875, 11.626953125, 12.24658203125, 12.8662109375, 13.48583984375, 14.10546875, 14.72509765625, 15.3447265625, 15.96435546875, 16.583984375, 17.20361328125, 17.8232421875, 18.44287109375, 19.0625]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 5.0, 2.0, 3.0, 11.0, 5.0, 3.0, 8.0, 16.0, 26.0, 28.0, 17.0, 35.0, 27.0, 44.0, 30.0, 30.0, 55.0, 76.0, 108.0, 205.0, 1585.0, 207.0, 92.0, 68.0, 56.0, 51.0, 40.0, 33.0, 37.0, 20.0, 27.0, 24.0, 21.0, 19.0, 7.0, 9.0, 8.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-48.59375, -47.14599609375, -45.6982421875, -44.25048828125, -42.802734375, -41.35498046875, -39.9072265625, -38.45947265625, -37.01171875, -35.56396484375, -34.1162109375, -32.66845703125, -31.220703125, -29.77294921875, -28.3251953125, -26.87744140625, -25.4296875, -23.98193359375, -22.5341796875, -21.08642578125, -19.638671875, -18.19091796875, -16.7431640625, -15.29541015625, -13.84765625, -12.39990234375, -10.9521484375, -9.50439453125, -8.056640625, -6.60888671875, -5.1611328125, -3.71337890625, -2.265625, -0.81787109375, 0.6298828125, 2.07763671875, 3.525390625, 4.97314453125, 6.4208984375, 7.86865234375, 9.31640625, 10.76416015625, 12.2119140625, 13.65966796875, 15.107421875, 16.55517578125, 18.0029296875, 19.45068359375, 20.8984375, 22.34619140625, 23.7939453125, 25.24169921875, 26.689453125, 28.13720703125, 29.5849609375, 31.03271484375, 32.48046875, 33.92822265625, 35.3759765625, 36.82373046875, 38.271484375, 39.71923828125, 41.1669921875, 42.61474609375, 44.0625]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 6.0, 4.0, 7.0, 13.0, 3.0, 7.0, 16.0, 26.0, 31.0, 28.0, 40.0, 64.0, 92.0, 133.0, 219.0, 364.0, 941.0, 2336.0, 7172.0, 24958.0, 150872.0, 2749073.0, 170117.0, 26890.0, 7786.0, 2452.0, 953.0, 362.0, 246.0, 119.0, 108.0, 54.0, 36.0, 41.0, 33.0, 15.0, 16.0, 19.0, 13.0, 5.0, 7.0, 5.0, 6.0, 7.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-52.34375, -50.734375, -49.125, -47.515625, -45.90625, -44.296875, -42.6875, -41.078125, -39.46875, -37.859375, -36.25, -34.640625, -33.03125, -31.421875, -29.8125, -28.203125, -26.59375, -24.984375, -23.375, -21.765625, -20.15625, -18.546875, -16.9375, -15.328125, -13.71875, -12.109375, -10.5, -8.890625, -7.28125, -5.671875, -4.0625, -2.453125, -0.84375, 0.765625, 2.375, 3.984375, 5.59375, 7.203125, 8.8125, 10.421875, 12.03125, 13.640625, 15.25, 16.859375, 18.46875, 20.078125, 21.6875, 23.296875, 24.90625, 26.515625, 28.125, 29.734375, 31.34375, 32.953125, 34.5625, 36.171875, 37.78125, 39.390625, 41.0, 42.609375, 44.21875, 45.828125, 47.4375, 49.046875, 50.65625]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 47.0, 390.0, 494.0, 71.0, 10.0, 1.0, 1.0, 1.0], "bins": [-779.1015625, -765.6905517578125, -752.279541015625, -738.8685302734375, -725.4574584960938, -712.0464477539062, -698.6354370117188, -685.2244262695312, -671.8134155273438, -658.4024047851562, -644.9913940429688, -631.580322265625, -618.1693115234375, -604.75830078125, -591.3472900390625, -577.936279296875, -564.5252685546875, -551.1142578125, -537.7032470703125, -524.292236328125, -510.8811950683594, -497.47015380859375, -484.05914306640625, -470.64813232421875, -457.237060546875, -443.8260498046875, -430.4150085449219, -417.0039978027344, -403.5929870605469, -390.18194580078125, -376.77093505859375, -363.35992431640625, -349.9489440917969, -336.5379333496094, -323.12689208984375, -309.71588134765625, -296.30487060546875, -282.89385986328125, -269.4828186035156, -256.0718078613281, -242.66078186035156, -229.249755859375, -215.8387451171875, -202.42771911621094, -189.01669311523438, -175.60568237304688, -162.1946563720703, -148.78363037109375, -135.37261962890625, -121.96160125732422, -108.55058288574219, -95.13955688476562, -81.7285385131836, -68.31752014160156, -54.906494140625, -41.49547576904297, -28.084457397460938, -14.673437118530273, -1.2624168395996094, 12.148605346679688, 25.55962371826172, 38.97064208984375, 52.38166809082031, 65.79268646240234, 79.20370483398438]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 5.0, 1.0, 6.0, 5.0, 4.0, 8.0, 6.0, 8.0, 16.0, 12.0, 11.0, 19.0, 19.0, 17.0, 16.0, 24.0, 24.0, 27.0, 29.0, 34.0, 26.0, 36.0, 40.0, 25.0, 37.0, 45.0, 37.0, 34.0, 38.0, 43.0, 41.0, 41.0, 33.0, 22.0, 34.0, 21.0, 15.0, 22.0, 23.0, 18.0, 19.0, 8.0, 9.0, 11.0, 10.0, 6.0, 6.0, 7.0, 3.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-85.95767211914062, -83.10855102539062, -80.25942993164062, -77.41031646728516, -74.56119537353516, -71.71207427978516, -68.86296081542969, -66.01383972167969, -63.16471862792969, -60.31559753417969, -57.46648025512695, -54.61736297607422, -51.76824188232422, -48.91912078857422, -46.070003509521484, -43.22088623046875, -40.37176513671875, -37.52264404296875, -34.673526763916016, -31.82440757751465, -28.97528839111328, -26.126169204711914, -23.277050018310547, -20.42793083190918, -17.578811645507812, -14.729692459106445, -11.880573272705078, -9.031454086303711, -6.182334899902344, -3.3332157135009766, -0.4840965270996094, 2.365022659301758, 5.214134216308594, 8.063253402709961, 10.912372589111328, 13.761491775512695, 16.610610961914062, 19.45973014831543, 22.308849334716797, 25.157968521118164, 28.00708770751953, 30.8562068939209, 33.705326080322266, 36.554443359375, 39.403564453125, 42.252685546875, 45.101802825927734, 47.95092010498047, 50.80004119873047, 53.64916229248047, 56.4982795715332, 59.34739685058594, 62.19651794433594, 65.04563903808594, 67.89476013183594, 70.7438735961914, 73.5929946899414, 76.4421157836914, 79.29122924804688, 82.14035034179688, 84.98947143554688, 87.83859252929688, 90.68771362304688, 93.53682708740234, 96.38594818115234]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 8.0, 3.0, 11.0, 10.0, 18.0, 22.0, 23.0, 24.0, 28.0, 33.0, 38.0, 29.0, 40.0, 35.0, 41.0, 42.0, 42.0, 49.0, 39.0, 48.0, 39.0, 62.0, 46.0, 40.0, 33.0, 18.0, 32.0, 26.0, 24.0, 27.0, 18.0, 14.0, 11.0, 5.0, 8.0, 7.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.453125, -19.849853515625, -19.24658203125, -18.643310546875, -18.0400390625, -17.436767578125, -16.83349609375, -16.230224609375, -15.626953125, -15.023681640625, -14.42041015625, -13.817138671875, -13.2138671875, -12.610595703125, -12.00732421875, -11.404052734375, -10.80078125, -10.197509765625, -9.59423828125, -8.990966796875, -8.3876953125, -7.784423828125, -7.18115234375, -6.577880859375, -5.974609375, -5.371337890625, -4.76806640625, -4.164794921875, -3.5615234375, -2.958251953125, -2.35498046875, -1.751708984375, -1.1484375, -0.545166015625, 0.05810546875, 0.661376953125, 1.2646484375, 1.867919921875, 2.47119140625, 3.074462890625, 3.677734375, 4.281005859375, 4.88427734375, 5.487548828125, 6.0908203125, 6.694091796875, 7.29736328125, 7.900634765625, 8.50390625, 9.107177734375, 9.71044921875, 10.313720703125, 10.9169921875, 11.520263671875, 12.12353515625, 12.726806640625, 13.330078125, 13.933349609375, 14.53662109375, 15.139892578125, 15.7431640625, 16.346435546875, 16.94970703125, 17.552978515625, 18.15625]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 3.0, 2.0, 4.0, 1.0, 4.0, 6.0, 11.0, 10.0, 10.0, 18.0, 14.0, 22.0, 28.0, 30.0, 35.0, 48.0, 58.0, 75.0, 85.0, 116.0, 183.0, 283.0, 652.0, 2020.0, 13444.0, 2764806.0, 1397797.0, 11174.0, 1758.0, 542.0, 298.0, 171.0, 133.0, 85.0, 64.0, 56.0, 47.0, 33.0, 24.0, 18.0, 19.0, 20.0, 16.0, 15.0, 14.0, 8.0, 6.0, 6.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-128.875, -124.96484375, -121.0546875, -117.14453125, -113.234375, -109.32421875, -105.4140625, -101.50390625, -97.59375, -93.68359375, -89.7734375, -85.86328125, -81.953125, -78.04296875, -74.1328125, -70.22265625, -66.3125, -62.40234375, -58.4921875, -54.58203125, -50.671875, -46.76171875, -42.8515625, -38.94140625, -35.03125, -31.12109375, -27.2109375, -23.30078125, -19.390625, -15.48046875, -11.5703125, -7.66015625, -3.75, 0.16015625, 4.0703125, 7.98046875, 11.890625, 15.80078125, 19.7109375, 23.62109375, 27.53125, 31.44140625, 35.3515625, 39.26171875, 43.171875, 47.08203125, 50.9921875, 54.90234375, 58.8125, 62.72265625, 66.6328125, 70.54296875, 74.453125, 78.36328125, 82.2734375, 86.18359375, 90.09375, 94.00390625, 97.9140625, 101.82421875, 105.734375, 109.64453125, 113.5546875, 117.46484375, 121.375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 2.0, 5.0, 3.0, 7.0, 4.0, 5.0, 8.0, 5.0, 8.0, 12.0, 16.0, 15.0, 22.0, 20.0, 20.0, 38.0, 31.0, 50.0, 93.0, 133.0, 221.0, 306.0, 554.0, 756.0, 642.0, 361.0, 231.0, 128.0, 84.0, 65.0, 54.0, 35.0, 29.0, 27.0, 20.0, 14.0, 9.0, 9.0, 7.0, 6.0, 6.0, 4.0, 6.0, 3.0, 5.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-24.640625, -23.908935546875, -23.17724609375, -22.445556640625, -21.7138671875, -20.982177734375, -20.25048828125, -19.518798828125, -18.787109375, -18.055419921875, -17.32373046875, -16.592041015625, -15.8603515625, -15.128662109375, -14.39697265625, -13.665283203125, -12.93359375, -12.201904296875, -11.47021484375, -10.738525390625, -10.0068359375, -9.275146484375, -8.54345703125, -7.811767578125, -7.080078125, -6.348388671875, -5.61669921875, -4.885009765625, -4.1533203125, -3.421630859375, -2.68994140625, -1.958251953125, -1.2265625, -0.494873046875, 0.23681640625, 0.968505859375, 1.7001953125, 2.431884765625, 3.16357421875, 3.895263671875, 4.626953125, 5.358642578125, 6.09033203125, 6.822021484375, 7.5537109375, 8.285400390625, 9.01708984375, 9.748779296875, 10.48046875, 11.212158203125, 11.94384765625, 12.675537109375, 13.4072265625, 14.138916015625, 14.87060546875, 15.602294921875, 16.333984375, 17.065673828125, 17.79736328125, 18.529052734375, 19.2607421875, 19.992431640625, 20.72412109375, 21.455810546875, 22.1875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 5.0, 11.0, 20.0, 24.0, 27.0, 31.0, 59.0, 86.0, 129.0, 224.0, 614.0, 1987.0, 7831.0, 43538.0, 983151.0, 3077974.0, 64004.0, 10664.0, 2467.0, 710.0, 309.0, 118.0, 89.0, 52.0, 37.0, 45.0, 19.0, 15.0, 11.0, 6.0, 5.0, 3.0, 3.0, 3.0, 5.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-73.1875, -70.833984375, -68.48046875, -66.126953125, -63.7734375, -61.419921875, -59.06640625, -56.712890625, -54.359375, -52.005859375, -49.65234375, -47.298828125, -44.9453125, -42.591796875, -40.23828125, -37.884765625, -35.53125, -33.177734375, -30.82421875, -28.470703125, -26.1171875, -23.763671875, -21.41015625, -19.056640625, -16.703125, -14.349609375, -11.99609375, -9.642578125, -7.2890625, -4.935546875, -2.58203125, -0.228515625, 2.125, 4.478515625, 6.83203125, 9.185546875, 11.5390625, 13.892578125, 16.24609375, 18.599609375, 20.953125, 23.306640625, 25.66015625, 28.013671875, 30.3671875, 32.720703125, 35.07421875, 37.427734375, 39.78125, 42.134765625, 44.48828125, 46.841796875, 49.1953125, 51.548828125, 53.90234375, 56.255859375, 58.609375, 60.962890625, 63.31640625, 65.669921875, 68.0234375, 70.376953125, 72.73046875, 75.083984375, 77.4375]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 3.0, 30.0, 318.0, 575.0, 81.0, 12.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.22539520263672, -56.66133117675781, -39.09726333618164, -21.53319549560547, -3.9691314697265625, 13.594932556152344, 31.15900421142578, 48.72306823730469, 66.2871322631836, 83.8511962890625, 101.41526794433594, 118.97933197021484, 136.54339599609375, 154.10745239257812, 171.67153930664062, 189.235595703125, 206.79965209960938, 224.3637237548828, 241.9277801513672, 259.4918518066406, 277.055908203125, 294.6199951171875, 312.1840515136719, 329.74810791015625, 347.31219482421875, 364.8762512207031, 382.4403381347656, 400.00439453125, 417.5684509277344, 435.13250732421875, 452.69659423828125, 470.2606506347656, 487.82476806640625, 505.3888244628906, 522.952880859375, 540.5169677734375, 558.0810546875, 575.6450805664062, 593.2091674804688, 610.7732543945312, 628.3372802734375, 645.9013671875, 663.4653930664062, 681.0294799804688, 698.5935668945312, 716.1575927734375, 733.7216796875, 751.2857666015625, 768.849853515625, 786.4139404296875, 803.9779663085938, 821.5420532226562, 839.1061401367188, 856.670166015625, 874.2342529296875, 891.79833984375, 909.3623657226562, 926.9264526367188, 944.490478515625, 962.0545654296875, 979.61865234375, 997.1826782226562, 1014.7467651367188, 1032.310791015625, 1049.8748779296875]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 1.0, 4.0, 5.0, 3.0, 3.0, 7.0, 12.0, 12.0, 18.0, 23.0, 19.0, 24.0, 28.0, 19.0, 31.0, 34.0, 46.0, 27.0, 42.0, 44.0, 35.0, 45.0, 51.0, 31.0, 45.0, 46.0, 36.0, 41.0, 44.0, 34.0, 30.0, 26.0, 20.0, 25.0, 28.0, 19.0, 10.0, 11.0, 6.0, 7.0, 2.0, 4.0, 3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-89.94453430175781, -87.46626281738281, -84.98799133300781, -82.50971221923828, -80.03144073486328, -77.55316925048828, -75.07489776611328, -72.59661865234375, -70.11834716796875, -67.64007568359375, -65.16180419921875, -62.683528900146484, -60.20525360107422, -57.72698211669922, -55.24871063232422, -52.77043533325195, -50.29216384887695, -47.81389236450195, -45.33561706542969, -42.85734558105469, -40.37907028198242, -37.90079879760742, -35.422523498535156, -32.944252014160156, -30.465978622436523, -27.98770523071289, -25.509431838989258, -23.031158447265625, -20.552886962890625, -18.07461166381836, -15.59634017944336, -13.118066787719727, -10.639793395996094, -8.161520004272461, -5.683247089385986, -3.2049741744995117, -0.7267007827758789, 1.751572608947754, 4.22984504699707, 6.708118438720703, 9.186391830444336, 11.664665222167969, 14.142938613891602, 16.621212005615234, 19.099483489990234, 21.5777587890625, 24.0560302734375, 26.534303665161133, 29.012577056884766, 31.4908504486084, 33.96912384033203, 36.44739532470703, 38.9256706237793, 41.4039421081543, 43.88221740722656, 46.36048889160156, 48.83876037597656, 51.31703186035156, 53.79530715942383, 56.27357864379883, 58.751853942871094, 61.230125427246094, 63.708396911621094, 66.18667602539062, 68.66494750976562]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 10.0, 15.0, 14.0, 11.0, 20.0, 16.0, 26.0, 37.0, 29.0, 25.0, 32.0, 41.0, 46.0, 48.0, 44.0, 48.0, 45.0, 46.0, 55.0, 44.0, 53.0, 37.0, 45.0, 33.0, 22.0, 32.0, 30.0, 26.0, 16.0, 13.0, 12.0, 9.0, 7.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.5, -18.897705078125, -18.29541015625, -17.693115234375, -17.0908203125, -16.488525390625, -15.88623046875, -15.283935546875, -14.681640625, -14.079345703125, -13.47705078125, -12.874755859375, -12.2724609375, -11.670166015625, -11.06787109375, -10.465576171875, -9.86328125, -9.260986328125, -8.65869140625, -8.056396484375, -7.4541015625, -6.851806640625, -6.24951171875, -5.647216796875, -5.044921875, -4.442626953125, -3.84033203125, -3.238037109375, -2.6357421875, -2.033447265625, -1.43115234375, -0.828857421875, -0.2265625, 0.375732421875, 0.97802734375, 1.580322265625, 2.1826171875, 2.784912109375, 3.38720703125, 3.989501953125, 4.591796875, 5.194091796875, 5.79638671875, 6.398681640625, 7.0009765625, 7.603271484375, 8.20556640625, 8.807861328125, 9.41015625, 10.012451171875, 10.61474609375, 11.217041015625, 11.8193359375, 12.421630859375, 13.02392578125, 13.626220703125, 14.228515625, 14.830810546875, 15.43310546875, 16.035400390625, 16.6376953125, 17.239990234375, 17.84228515625, 18.444580078125, 19.046875]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 3.0, 7.0, 8.0, 23.0, 22.0, 46.0, 67.0, 81.0, 127.0, 194.0, 319.0, 484.0, 747.0, 1242.0, 2112.0, 3394.0, 5707.0, 9716.0, 17037.0, 30133.0, 53334.0, 95703.0, 174369.0, 263436.0, 172646.0, 94221.0, 52546.0, 29770.0, 17031.0, 9626.0, 5690.0, 3331.0, 2030.0, 1271.0, 722.0, 484.0, 306.0, 198.0, 138.0, 82.0, 50.0, 29.0, 28.0, 12.0, 17.0, 8.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.384033203125, -0.3718376159667969, -0.35964202880859375, -0.3474464416503906, -0.3352508544921875, -0.3230552673339844, -0.31085968017578125, -0.2986640930175781, -0.286468505859375, -0.2742729187011719, -0.26207733154296875, -0.24988174438476562, -0.2376861572265625, -0.22549057006835938, -0.21329498291015625, -0.20109939575195312, -0.18890380859375, -0.17670822143554688, -0.16451263427734375, -0.15231704711914062, -0.1401214599609375, -0.12792587280273438, -0.11573028564453125, -0.10353469848632812, -0.091339111328125, -0.07914352416992188, -0.06694793701171875, -0.054752349853515625, -0.0425567626953125, -0.030361175537109375, -0.01816558837890625, -0.005970001220703125, 0.0062255859375, 0.018421173095703125, 0.03061676025390625, 0.042812347412109375, 0.0550079345703125, 0.06720352172851562, 0.07939910888671875, 0.09159469604492188, 0.103790283203125, 0.11598587036132812, 0.12818145751953125, 0.14037704467773438, 0.1525726318359375, 0.16476821899414062, 0.17696380615234375, 0.18915939331054688, 0.20135498046875, 0.21355056762695312, 0.22574615478515625, 0.23794174194335938, 0.2501373291015625, 0.2623329162597656, 0.27452850341796875, 0.2867240905761719, 0.298919677734375, 0.3111152648925781, 0.32331085205078125, 0.3355064392089844, 0.3477020263671875, 0.3598976135253906, 0.37209320068359375, 0.3842887878417969, 0.396484375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 5.0, 6.0, 3.0, 5.0, 8.0, 15.0, 10.0, 16.0, 17.0, 17.0, 28.0, 28.0, 28.0, 28.0, 33.0, 28.0, 44.0, 31.0, 35.0, 41.0, 41.0, 1058.0, 36.0, 51.0, 48.0, 38.0, 29.0, 32.0, 24.0, 34.0, 29.0, 25.0, 33.0, 16.0, 16.0, 20.0, 8.0, 12.0, 12.0, 10.0, 4.0, 5.0, 7.0, 7.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.359375, -10.01171875, -9.6640625, -9.31640625, -8.96875, -8.62109375, -8.2734375, -7.92578125, -7.578125, -7.23046875, -6.8828125, -6.53515625, -6.1875, -5.83984375, -5.4921875, -5.14453125, -4.796875, -4.44921875, -4.1015625, -3.75390625, -3.40625, -3.05859375, -2.7109375, -2.36328125, -2.015625, -1.66796875, -1.3203125, -0.97265625, -0.625, -0.27734375, 0.0703125, 0.41796875, 0.765625, 1.11328125, 1.4609375, 1.80859375, 2.15625, 2.50390625, 2.8515625, 3.19921875, 3.546875, 3.89453125, 4.2421875, 4.58984375, 4.9375, 5.28515625, 5.6328125, 5.98046875, 6.328125, 6.67578125, 7.0234375, 7.37109375, 7.71875, 8.06640625, 8.4140625, 8.76171875, 9.109375, 9.45703125, 9.8046875, 10.15234375, 10.5, 10.84765625, 11.1953125, 11.54296875, 11.890625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 8.0, 12.0, 14.0, 35.0, 50.0, 91.0, 138.0, 204.0, 400.0, 595.0, 882.0, 1357.0, 2019.0, 3322.0, 5350.0, 8697.0, 14370.0, 23701.0, 39814.0, 67846.0, 120329.0, 233289.0, 1275200.0, 125342.0, 70060.0, 41203.0, 24498.0, 14439.0, 8934.0, 5454.0, 3475.0, 2125.0, 1397.0, 920.0, 613.0, 372.0, 235.0, 139.0, 84.0, 45.0, 18.0, 13.0, 11.0, 12.0, 4.0, 5.0, 4.0, 8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2047119140625, -0.19811439514160156, -0.19151687622070312, -0.1849193572998047, -0.17832183837890625, -0.1717243194580078, -0.16512680053710938, -0.15852928161621094, -0.1519317626953125, -0.14533424377441406, -0.13873672485351562, -0.1321392059326172, -0.12554168701171875, -0.11894416809082031, -0.11234664916992188, -0.10574913024902344, -0.099151611328125, -0.09255409240722656, -0.08595657348632812, -0.07935905456542969, -0.07276153564453125, -0.06616401672363281, -0.059566497802734375, -0.05296897888183594, -0.0463714599609375, -0.03977394104003906, -0.033176422119140625, -0.026578903198242188, -0.01998138427734375, -0.013383865356445312, -0.006786346435546875, -0.0001888275146484375, 0.00640869140625, 0.013006210327148438, 0.019603729248046875, 0.026201248168945312, 0.03279876708984375, 0.03939628601074219, 0.045993804931640625, 0.05259132385253906, 0.0591888427734375, 0.06578636169433594, 0.07238388061523438, 0.07898139953613281, 0.08557891845703125, 0.09217643737792969, 0.09877395629882812, 0.10537147521972656, 0.111968994140625, 0.11856651306152344, 0.12516403198242188, 0.1317615509033203, 0.13835906982421875, 0.1449565887451172, 0.15155410766601562, 0.15815162658691406, 0.1647491455078125, 0.17134666442871094, 0.17794418334960938, 0.1845417022705078, 0.19113922119140625, 0.1977367401123047, 0.20433425903320312, 0.21093177795410156, 0.217529296875]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 4.0, 3.0, 7.0, 4.0, 6.0, 14.0, 16.0, 18.0, 36.0, 50.0, 54.0, 82.0, 141.0, 147.0, 107.0, 81.0, 59.0, 45.0, 28.0, 19.0, 20.0, 13.0, 7.0, 7.0, 8.0, 3.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003809928894042969, -0.0003670230507850647, -0.0003530532121658325, -0.00033908337354660034, -0.00032511353492736816, -0.000311143696308136, -0.0002971738576889038, -0.00028320401906967163, -0.00026923418045043945, -0.0002552643418312073, -0.0002412945032119751, -0.00022732466459274292, -0.00021335482597351074, -0.00019938498735427856, -0.0001854151487350464, -0.0001714453101158142, -0.00015747547149658203, -0.00014350563287734985, -0.00012953579425811768, -0.0001155659556388855, -0.00010159611701965332, -8.762627840042114e-05, -7.365643978118896e-05, -5.968660116195679e-05, -4.571676254272461e-05, -3.174692392349243e-05, -1.7777085304260254e-05, -3.807246685028076e-06, 1.0162591934204102e-05, 2.413243055343628e-05, 3.810226917266846e-05, 5.2072107791900635e-05, 6.604194641113281e-05, 8.001178503036499e-05, 9.398162364959717e-05, 0.00010795146226882935, 0.00012192130088806152, 0.0001358911395072937, 0.00014986097812652588, 0.00016383081674575806, 0.00017780065536499023, 0.0001917704939842224, 0.0002057403326034546, 0.00021971017122268677, 0.00023368000984191895, 0.0002476498484611511, 0.0002616196870803833, 0.0002755895256996155, 0.00028955936431884766, 0.00030352920293807983, 0.000317499041557312, 0.0003314688801765442, 0.00034543871879577637, 0.00035940855741500854, 0.0003733783960342407, 0.0003873482346534729, 0.0004013180732727051, 0.00041528791189193726, 0.00042925775051116943, 0.0004432275891304016, 0.0004571974277496338, 0.00047116726636886597, 0.00048513710498809814, 0.0004991069436073303, 0.0005130767822265625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 3.0, 6.0, 5.0, 5.0, 9.0, 7.0, 11.0, 20.0, 33.0, 38.0, 57.0, 94.0, 166.0, 358.0, 1598.0, 1023800.0, 21245.0, 555.0, 227.0, 108.0, 71.0, 38.0, 19.0, 24.0, 12.0, 8.0, 11.0, 5.0, 4.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0111846923828125, -0.010880231857299805, -0.01057577133178711, -0.010271310806274414, -0.009966850280761719, -0.009662389755249023, -0.009357929229736328, -0.009053468704223633, -0.008749008178710938, -0.008444547653198242, -0.008140087127685547, -0.007835626602172852, -0.007531166076660156, -0.007226705551147461, -0.006922245025634766, -0.00661778450012207, -0.006313323974609375, -0.00600886344909668, -0.005704402923583984, -0.005399942398071289, -0.005095481872558594, -0.0047910213470458984, -0.004486560821533203, -0.004182100296020508, -0.0038776397705078125, -0.003573179244995117, -0.003268718719482422, -0.0029642581939697266, -0.0026597976684570312, -0.002355337142944336, -0.0020508766174316406, -0.0017464160919189453, -0.00144195556640625, -0.0011374950408935547, -0.0008330345153808594, -0.0005285739898681641, -0.00022411346435546875, 8.034706115722656e-05, 0.0003848075866699219, 0.0006892681121826172, 0.0009937286376953125, 0.0012981891632080078, 0.0016026496887207031, 0.0019071102142333984, 0.0022115707397460938, 0.002516031265258789, 0.0028204917907714844, 0.0031249523162841797, 0.003429412841796875, 0.0037338733673095703, 0.004038333892822266, 0.004342794418334961, 0.004647254943847656, 0.0049517154693603516, 0.005256175994873047, 0.005560636520385742, 0.0058650970458984375, 0.006169557571411133, 0.006474018096923828, 0.0067784786224365234, 0.007082939147949219, 0.007387399673461914, 0.007691860198974609, 0.007996320724487305, 0.00830078125]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 17.0, 251.0, 689.0, 45.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0012884201714769006, -0.001239330624230206, -0.0011902411933988333, -0.0011411516461521387, -0.0010920620989054441, -0.0010429726680740714, -0.0009938831208273768, -0.0009447936317883432, -0.0008957041427493095, -0.0008466146537102759, -0.0007975251646712422, -0.0007484356174245477, -0.000699346128385514, -0.0006502566393464804, -0.0006011670920997858, -0.0005520776030607522, -0.0005029881140217185, -0.00045389862498268485, -0.00040480910683982074, -0.00035571958869695663, -0.000306630099657923, -0.00025754061061888933, -0.00020845109247602522, -0.00015936157433316112, -0.00011027208529412746, -6.118258170317858e-05, -1.2093078112229705e-05, 3.6996425478719175e-05, 8.608592906966805e-05, 0.0001351754181087017, 0.00018426493625156581, 0.00023335445439442992, 0.0002824440598487854, 0.00033153354888781905, 0.00038062306703068316, 0.00042971258517354727, 0.0004788020742125809, 0.0005278915632516146, 0.0005769811104983091, 0.0006260705995373428, 0.0006751600885763764, 0.0007242495776154101, 0.0007733390666544437, 0.0008224286139011383, 0.000871518102940172, 0.0009206075919792056, 0.0009696971392259002, 0.001018786570057273, 0.0010678761173039675, 0.001116965664550662, 0.0011660550953820348, 0.0012151446426287293, 0.001264234073460102, 0.0013133236207067966, 0.0013624131679534912, 0.0014115027152001858, 0.0014605921460315585, 0.001509681693278253, 0.0015587711241096258, 0.0016078606713563204, 0.001656950218603015, 0.0017060396494343877, 0.0017551291966810822, 0.001804218627512455, 0.0018533081747591496]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 10.0, 10.0, 15.0, 27.0, 39.0, 52.0, 62.0, 63.0, 61.0, 92.0, 79.0, 67.0, 89.0, 69.0, 62.0, 53.0, 46.0, 37.0, 28.0, 16.0, 12.0, 7.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00040787458419799805, -0.000395849347114563, -0.00038382411003112793, -0.00037179887294769287, -0.0003597736358642578, -0.00034774839878082275, -0.0003357231616973877, -0.00032369792461395264, -0.0003116726875305176, -0.0002996474504470825, -0.00028762221336364746, -0.0002755969762802124, -0.00026357173919677734, -0.0002515465021133423, -0.00023952126502990723, -0.00022749602794647217, -0.0002154707908630371, -0.00020344555377960205, -0.000191420316696167, -0.00017939507961273193, -0.00016736984252929688, -0.00015534460544586182, -0.00014331936836242676, -0.0001312941312789917, -0.00011926889419555664, -0.00010724365711212158, -9.521842002868652e-05, -8.319318294525146e-05, -7.11679458618164e-05, -5.914270877838135e-05, -4.711747169494629e-05, -3.509223461151123e-05, -2.3066997528076172e-05, -1.1041760444641113e-05, 9.834766387939453e-07, 1.3008713722229004e-05, 2.5033950805664062e-05, 3.705918788909912e-05, 4.908442497253418e-05, 6.110966205596924e-05, 7.31348991394043e-05, 8.516013622283936e-05, 9.718537330627441e-05, 0.00010921061038970947, 0.00012123584747314453, 0.0001332610845565796, 0.00014528632164001465, 0.0001573115587234497, 0.00016933679580688477, 0.00018136203289031982, 0.00019338726997375488, 0.00020541250705718994, 0.000217437744140625, 0.00022946298122406006, 0.00024148821830749512, 0.0002535134553909302, 0.00026553869247436523, 0.0002775639295578003, 0.00028958916664123535, 0.0003016144037246704, 0.00031363964080810547, 0.00032566487789154053, 0.0003376901149749756, 0.00034971535205841064, 0.0003617405891418457]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 10.0, 15.0, 14.0, 11.0, 20.0, 16.0, 26.0, 37.0, 29.0, 25.0, 32.0, 41.0, 46.0, 48.0, 44.0, 48.0, 45.0, 46.0, 55.0, 44.0, 53.0, 37.0, 45.0, 33.0, 22.0, 32.0, 30.0, 26.0, 16.0, 13.0, 12.0, 9.0, 7.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.5, -18.897705078125, -18.29541015625, -17.693115234375, -17.0908203125, -16.488525390625, -15.88623046875, -15.283935546875, -14.681640625, -14.079345703125, -13.47705078125, -12.874755859375, -12.2724609375, -11.670166015625, -11.06787109375, -10.465576171875, -9.86328125, -9.260986328125, -8.65869140625, -8.056396484375, -7.4541015625, -6.851806640625, -6.24951171875, -5.647216796875, -5.044921875, -4.442626953125, -3.84033203125, -3.238037109375, -2.6357421875, -2.033447265625, -1.43115234375, -0.828857421875, -0.2265625, 0.375732421875, 0.97802734375, 1.580322265625, 2.1826171875, 2.784912109375, 3.38720703125, 3.989501953125, 4.591796875, 5.194091796875, 5.79638671875, 6.398681640625, 7.0009765625, 7.603271484375, 8.20556640625, 8.807861328125, 9.41015625, 10.012451171875, 10.61474609375, 11.217041015625, 11.8193359375, 12.421630859375, 13.02392578125, 13.626220703125, 14.228515625, 14.830810546875, 15.43310546875, 16.035400390625, 16.6376953125, 17.239990234375, 17.84228515625, 18.444580078125, 19.046875]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 6.0, 1.0, 8.0, 4.0, 8.0, 10.0, 20.0, 25.0, 40.0, 44.0, 70.0, 107.0, 157.0, 263.0, 368.0, 580.0, 847.0, 1306.0, 2170.0, 3275.0, 5781.0, 10134.0, 19279.0, 41619.0, 104142.0, 313633.0, 339631.0, 113461.0, 44762.0, 20934.0, 10408.0, 5877.0, 3441.0, 2190.0, 1381.0, 833.0, 566.0, 372.0, 253.0, 177.0, 132.0, 72.0, 50.0, 51.0, 19.0, 19.0, 10.0, 12.0, 9.0, 8.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.390625, -20.654052734375, -19.91748046875, -19.180908203125, -18.4443359375, -17.707763671875, -16.97119140625, -16.234619140625, -15.498046875, -14.761474609375, -14.02490234375, -13.288330078125, -12.5517578125, -11.815185546875, -11.07861328125, -10.342041015625, -9.60546875, -8.868896484375, -8.13232421875, -7.395751953125, -6.6591796875, -5.922607421875, -5.18603515625, -4.449462890625, -3.712890625, -2.976318359375, -2.23974609375, -1.503173828125, -0.7666015625, -0.030029296875, 0.70654296875, 1.443115234375, 2.1796875, 2.916259765625, 3.65283203125, 4.389404296875, 5.1259765625, 5.862548828125, 6.59912109375, 7.335693359375, 8.072265625, 8.808837890625, 9.54541015625, 10.281982421875, 11.0185546875, 11.755126953125, 12.49169921875, 13.228271484375, 13.96484375, 14.701416015625, 15.43798828125, 16.174560546875, 16.9111328125, 17.647705078125, 18.38427734375, 19.120849609375, 19.857421875, 20.593994140625, 21.33056640625, 22.067138671875, 22.8037109375, 23.540283203125, 24.27685546875, 25.013427734375, 25.75]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 6.0, 4.0, 4.0, 7.0, 10.0, 13.0, 16.0, 25.0, 21.0, 26.0, 38.0, 37.0, 40.0, 54.0, 55.0, 89.0, 138.0, 1510.0, 390.0, 140.0, 72.0, 71.0, 47.0, 46.0, 37.0, 26.0, 29.0, 21.0, 18.0, 14.0, 14.0, 9.0, 4.0, 3.0, 7.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.8125, -47.37158203125, -45.9306640625, -44.48974609375, -43.048828125, -41.60791015625, -40.1669921875, -38.72607421875, -37.28515625, -35.84423828125, -34.4033203125, -32.96240234375, -31.521484375, -30.08056640625, -28.6396484375, -27.19873046875, -25.7578125, -24.31689453125, -22.8759765625, -21.43505859375, -19.994140625, -18.55322265625, -17.1123046875, -15.67138671875, -14.23046875, -12.78955078125, -11.3486328125, -9.90771484375, -8.466796875, -7.02587890625, -5.5849609375, -4.14404296875, -2.703125, -1.26220703125, 0.1787109375, 1.61962890625, 3.060546875, 4.50146484375, 5.9423828125, 7.38330078125, 8.82421875, 10.26513671875, 11.7060546875, 13.14697265625, 14.587890625, 16.02880859375, 17.4697265625, 18.91064453125, 20.3515625, 21.79248046875, 23.2333984375, 24.67431640625, 26.115234375, 27.55615234375, 28.9970703125, 30.43798828125, 31.87890625, 33.31982421875, 34.7607421875, 36.20166015625, 37.642578125, 39.08349609375, 40.5244140625, 41.96533203125, 43.40625]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 6.0, 13.0, 14.0, 15.0, 24.0, 22.0, 29.0, 68.0, 121.0, 173.0, 350.0, 952.0, 8855.0, 3044388.0, 87297.0, 2198.0, 548.0, 254.0, 107.0, 75.0, 60.0, 32.0, 28.0, 20.0, 9.0, 14.0, 7.0, 4.0, 5.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-185.875, -181.1982421875, -176.521484375, -171.8447265625, -167.16796875, -162.4912109375, -157.814453125, -153.1376953125, -148.4609375, -143.7841796875, -139.107421875, -134.4306640625, -129.75390625, -125.0771484375, -120.400390625, -115.7236328125, -111.046875, -106.3701171875, -101.693359375, -97.0166015625, -92.33984375, -87.6630859375, -82.986328125, -78.3095703125, -73.6328125, -68.9560546875, -64.279296875, -59.6025390625, -54.92578125, -50.2490234375, -45.572265625, -40.8955078125, -36.21875, -31.5419921875, -26.865234375, -22.1884765625, -17.51171875, -12.8349609375, -8.158203125, -3.4814453125, 1.1953125, 5.8720703125, 10.548828125, 15.2255859375, 19.90234375, 24.5791015625, 29.255859375, 33.9326171875, 38.609375, 43.2861328125, 47.962890625, 52.6396484375, 57.31640625, 61.9931640625, 66.669921875, 71.3466796875, 76.0234375, 80.7001953125, 85.376953125, 90.0537109375, 94.73046875, 99.4072265625, 104.083984375, 108.7607421875, 113.4375]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 19.0, 679.0, 311.0, 9.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-445.6768493652344, -420.7241516113281, -395.771484375, -370.81878662109375, -345.8660888671875, -320.9134216308594, -295.9607238769531, -271.008056640625, -246.05535888671875, -221.10267639160156, -196.14999389648438, -171.19729614257812, -146.24461364746094, -121.29193115234375, -96.3392333984375, -71.38655090332031, -46.433868408203125, -21.481182098388672, 3.4715042114257812, 28.4241943359375, 53.37687683105469, 78.32955932617188, 103.28225708007812, 128.2349395751953, 153.1876220703125, 178.1403045654297, 203.09298706054688, 228.04568481445312, 252.9983673095703, 277.9510498046875, 302.90374755859375, 327.8564453125, 352.80908203125, 377.76177978515625, 402.7144470214844, 427.6671447753906, 452.61981201171875, 477.572509765625, 502.52520751953125, 527.4779052734375, 552.4305419921875, 577.3832397460938, 602.3359375, 627.28857421875, 652.2412719726562, 677.1939697265625, 702.1466674804688, 727.099365234375, 752.0520629882812, 777.0047607421875, 801.9574584960938, 826.91015625, 851.86279296875, 876.8154907226562, 901.7681884765625, 926.7208862304688, 951.673583984375, 976.6262817382812, 1001.5789794921875, 1026.5316162109375, 1051.484375, 1076.43701171875, 1101.3896484375, 1126.3424072265625, 1151.2950439453125]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 2.0, 4.0, 10.0, 4.0, 8.0, 10.0, 10.0, 26.0, 24.0, 16.0, 27.0, 38.0, 21.0, 34.0, 44.0, 43.0, 30.0, 36.0, 43.0, 43.0, 53.0, 51.0, 27.0, 52.0, 38.0, 23.0, 46.0, 38.0, 30.0, 28.0, 31.0, 20.0, 20.0, 9.0, 13.0, 14.0, 8.0, 8.0, 3.0, 4.0, 12.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.79092407226562, -101.34465789794922, -97.89839172363281, -94.4521255493164, -91.005859375, -87.5595932006836, -84.11332702636719, -80.66705322265625, -77.22079467773438, -73.77452850341797, -70.32826232910156, -66.88199615478516, -63.43572998046875, -59.989463806152344, -56.54319381713867, -53.096927642822266, -49.650657653808594, -46.20439147949219, -42.75812530517578, -39.311859130859375, -35.86559295654297, -32.41932678222656, -28.97305679321289, -25.526790618896484, -22.080524444580078, -18.634258270263672, -15.18799114227295, -11.741724014282227, -8.29545783996582, -4.849191665649414, -1.402923583984375, 2.0433425903320312, 5.4896087646484375, 8.935874938964844, 12.382142066955566, 15.828409194946289, 19.274675369262695, 22.7209415435791, 26.16720962524414, 29.613475799560547, 33.05974197387695, 36.50600814819336, 39.952274322509766, 43.39854431152344, 46.844810485839844, 50.29107666015625, 53.737342834472656, 57.18360900878906, 60.62987518310547, 64.07614135742188, 67.52240753173828, 70.96867370605469, 74.4149398803711, 77.8612060546875, 81.30747985839844, 84.75373840332031, 88.20001220703125, 91.64627838134766, 95.09254455566406, 98.53881072998047, 101.98507690429688, 105.43134307861328, 108.87760925292969, 112.32388305664062, 115.7701416015625]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 8.0, 7.0, 16.0, 10.0, 15.0, 13.0, 27.0, 27.0, 25.0, 28.0, 48.0, 43.0, 39.0, 36.0, 43.0, 40.0, 47.0, 42.0, 62.0, 47.0, 47.0, 40.0, 49.0, 37.0, 31.0, 24.0, 19.0, 21.0, 19.0, 15.0, 27.0, 14.0, 10.0, 5.0, 8.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.546875, -18.940185546875, -18.33349609375, -17.726806640625, -17.1201171875, -16.513427734375, -15.90673828125, -15.300048828125, -14.693359375, -14.086669921875, -13.47998046875, -12.873291015625, -12.2666015625, -11.659912109375, -11.05322265625, -10.446533203125, -9.83984375, -9.233154296875, -8.62646484375, -8.019775390625, -7.4130859375, -6.806396484375, -6.19970703125, -5.593017578125, -4.986328125, -4.379638671875, -3.77294921875, -3.166259765625, -2.5595703125, -1.952880859375, -1.34619140625, -0.739501953125, -0.1328125, 0.473876953125, 1.08056640625, 1.687255859375, 2.2939453125, 2.900634765625, 3.50732421875, 4.114013671875, 4.720703125, 5.327392578125, 5.93408203125, 6.540771484375, 7.1474609375, 7.754150390625, 8.36083984375, 8.967529296875, 9.57421875, 10.180908203125, 10.78759765625, 11.394287109375, 12.0009765625, 12.607666015625, 13.21435546875, 13.821044921875, 14.427734375, 15.034423828125, 15.64111328125, 16.247802734375, 16.8544921875, 17.461181640625, 18.06787109375, 18.674560546875, 19.28125]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 3.0, 3.0, 10.0, 10.0, 12.0, 21.0, 19.0, 27.0, 41.0, 44.0, 64.0, 82.0, 135.0, 178.0, 229.0, 385.0, 609.0, 1057.0, 1811.0, 3547.0, 8579.0, 35584.0, 420803.0, 2603901.0, 1001839.0, 90254.0, 14431.0, 4797.0, 2366.0, 1258.0, 763.0, 445.0, 280.0, 206.0, 151.0, 94.0, 54.0, 48.0, 32.0, 22.0, 21.0, 19.0, 16.0, 14.0, 3.0, 5.0, 6.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-33.25, -32.23291015625, -31.2158203125, -30.19873046875, -29.181640625, -28.16455078125, -27.1474609375, -26.13037109375, -25.11328125, -24.09619140625, -23.0791015625, -22.06201171875, -21.044921875, -20.02783203125, -19.0107421875, -17.99365234375, -16.9765625, -15.95947265625, -14.9423828125, -13.92529296875, -12.908203125, -11.89111328125, -10.8740234375, -9.85693359375, -8.83984375, -7.82275390625, -6.8056640625, -5.78857421875, -4.771484375, -3.75439453125, -2.7373046875, -1.72021484375, -0.703125, 0.31396484375, 1.3310546875, 2.34814453125, 3.365234375, 4.38232421875, 5.3994140625, 6.41650390625, 7.43359375, 8.45068359375, 9.4677734375, 10.48486328125, 11.501953125, 12.51904296875, 13.5361328125, 14.55322265625, 15.5703125, 16.58740234375, 17.6044921875, 18.62158203125, 19.638671875, 20.65576171875, 21.6728515625, 22.68994140625, 23.70703125, 24.72412109375, 25.7412109375, 26.75830078125, 27.775390625, 28.79248046875, 29.8095703125, 30.82666015625, 31.84375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 6.0, 3.0, 7.0, 4.0, 19.0, 11.0, 18.0, 15.0, 32.0, 38.0, 56.0, 58.0, 101.0, 140.0, 252.0, 344.0, 559.0, 680.0, 556.0, 360.0, 217.0, 171.0, 107.0, 80.0, 61.0, 49.0, 28.0, 30.0, 26.0, 14.0, 8.0, 11.0, 4.0, 5.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.484375, -25.587890625, -24.69140625, -23.794921875, -22.8984375, -22.001953125, -21.10546875, -20.208984375, -19.3125, -18.416015625, -17.51953125, -16.623046875, -15.7265625, -14.830078125, -13.93359375, -13.037109375, -12.140625, -11.244140625, -10.34765625, -9.451171875, -8.5546875, -7.658203125, -6.76171875, -5.865234375, -4.96875, -4.072265625, -3.17578125, -2.279296875, -1.3828125, -0.486328125, 0.41015625, 1.306640625, 2.203125, 3.099609375, 3.99609375, 4.892578125, 5.7890625, 6.685546875, 7.58203125, 8.478515625, 9.375, 10.271484375, 11.16796875, 12.064453125, 12.9609375, 13.857421875, 14.75390625, 15.650390625, 16.546875, 17.443359375, 18.33984375, 19.236328125, 20.1328125, 21.029296875, 21.92578125, 22.822265625, 23.71875, 24.615234375, 25.51171875, 26.408203125, 27.3046875, 28.201171875, 29.09765625, 29.994140625, 30.890625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 8.0, 7.0, 12.0, 27.0, 28.0, 42.0, 76.0, 93.0, 147.0, 253.0, 466.0, 841.0, 1858.0, 4249.0, 11680.0, 40257.0, 203027.0, 2722548.0, 1058032.0, 110509.0, 25680.0, 8228.0, 3176.0, 1335.0, 707.0, 368.0, 238.0, 138.0, 73.0, 56.0, 46.0, 25.0, 17.0, 11.0, 5.0, 11.0, 3.0, 7.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.8125, -36.69482421875, -35.5771484375, -34.45947265625, -33.341796875, -32.22412109375, -31.1064453125, -29.98876953125, -28.87109375, -27.75341796875, -26.6357421875, -25.51806640625, -24.400390625, -23.28271484375, -22.1650390625, -21.04736328125, -19.9296875, -18.81201171875, -17.6943359375, -16.57666015625, -15.458984375, -14.34130859375, -13.2236328125, -12.10595703125, -10.98828125, -9.87060546875, -8.7529296875, -7.63525390625, -6.517578125, -5.39990234375, -4.2822265625, -3.16455078125, -2.046875, -0.92919921875, 0.1884765625, 1.30615234375, 2.423828125, 3.54150390625, 4.6591796875, 5.77685546875, 6.89453125, 8.01220703125, 9.1298828125, 10.24755859375, 11.365234375, 12.48291015625, 13.6005859375, 14.71826171875, 15.8359375, 16.95361328125, 18.0712890625, 19.18896484375, 20.306640625, 21.42431640625, 22.5419921875, 23.65966796875, 24.77734375, 25.89501953125, 27.0126953125, 28.13037109375, 29.248046875, 30.36572265625, 31.4833984375, 32.60107421875, 33.71875]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 17.0, 76.0, 195.0, 324.0, 264.0, 88.0, 33.0, 8.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-118.43685913085938, -109.78137969970703, -101.12590026855469, -92.47042083740234, -83.81494140625, -75.15946197509766, -66.50398254394531, -57.84850311279297, -49.193023681640625, -40.53754425048828, -31.882064819335938, -23.226585388183594, -14.57110595703125, -5.915626525878906, 2.7398529052734375, 11.395332336425781, 20.050811767578125, 28.70629119873047, 37.36177062988281, 46.017250061035156, 54.6727294921875, 63.328208923339844, 71.98368835449219, 80.63916778564453, 89.29464721679688, 97.95012664794922, 106.60560607910156, 115.2610855102539, 123.91656494140625, 132.57205200195312, 141.22752380371094, 149.88299560546875, 158.53848266601562, 167.1939697265625, 175.8494415283203, 184.50491333007812, 193.160400390625, 201.81588745117188, 210.4713592529297, 219.1268310546875, 227.78231811523438, 236.43780517578125, 245.09327697753906, 253.74874877929688, 262.40423583984375, 271.0597229003906, 279.7152099609375, 288.37066650390625, 297.0261535644531, 305.681640625, 314.33709716796875, 322.9925842285156, 331.6480712890625, 340.3035583496094, 348.95904541015625, 357.614501953125, 366.2699890136719, 374.92547607421875, 383.5809326171875, 392.2364196777344, 400.89190673828125, 409.5473937988281, 418.202880859375, 426.85833740234375, 435.5138244628906]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 8.0, 5.0, 6.0, 12.0, 9.0, 12.0, 9.0, 18.0, 25.0, 27.0, 24.0, 29.0, 39.0, 35.0, 30.0, 25.0, 46.0, 37.0, 52.0, 48.0, 47.0, 28.0, 43.0, 48.0, 41.0, 41.0, 34.0, 38.0, 26.0, 27.0, 27.0, 24.0, 12.0, 11.0, 11.0, 14.0, 9.0, 6.0, 5.0, 3.0, 8.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-101.22217559814453, -98.37931060791016, -95.53643798828125, -92.69357299804688, -89.8507080078125, -87.0078353881836, -84.16497039794922, -81.32209777832031, -78.47923278808594, -75.63636779785156, -72.79349517822266, -69.95063018798828, -67.10775756835938, -64.264892578125, -61.422027587890625, -58.579158782958984, -55.736289978027344, -52.8934211730957, -50.05055236816406, -47.20768737792969, -44.36481857299805, -41.521949768066406, -38.67908477783203, -35.83621597290039, -32.99334716796875, -30.15047836303711, -27.3076114654541, -24.464744567871094, -21.621875762939453, -18.779006958007812, -15.936140060424805, -13.093273162841797, -10.250411987304688, -7.407544136047363, -4.564676284790039, -1.7218084335327148, 1.1210594177246094, 3.9639272689819336, 6.806795120239258, 9.649662017822266, 12.492530822753906, 15.33539867401123, 18.178266525268555, 21.021133422851562, 23.864002227783203, 26.706871032714844, 29.54973793029785, 32.39260482788086, 35.2354736328125, 38.07834243774414, 40.92121124267578, 43.764076232910156, 46.6069450378418, 49.44981384277344, 52.29267883300781, 55.13554763793945, 57.978416442871094, 60.821285247802734, 63.664154052734375, 66.50701904296875, 69.34988403320312, 72.19275665283203, 75.0356216430664, 77.87849426269531, 80.72135925292969]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 3.0, 9.0, 3.0, 8.0, 10.0, 14.0, 11.0, 13.0, 21.0, 23.0, 24.0, 23.0, 31.0, 29.0, 47.0, 44.0, 47.0, 26.0, 41.0, 61.0, 45.0, 42.0, 45.0, 42.0, 30.0, 40.0, 39.0, 45.0, 28.0, 30.0, 25.0, 16.0, 18.0, 11.0, 13.0, 11.0, 9.0, 6.0, 7.0, 7.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8828125, -12.4093017578125, -11.935791015625, -11.4622802734375, -10.98876953125, -10.5152587890625, -10.041748046875, -9.5682373046875, -9.0947265625, -8.6212158203125, -8.147705078125, -7.6741943359375, -7.20068359375, -6.7271728515625, -6.253662109375, -5.7801513671875, -5.306640625, -4.8331298828125, -4.359619140625, -3.8861083984375, -3.41259765625, -2.9390869140625, -2.465576171875, -1.9920654296875, -1.5185546875, -1.0450439453125, -0.571533203125, -0.0980224609375, 0.37548828125, 0.8489990234375, 1.322509765625, 1.7960205078125, 2.26953125, 2.7430419921875, 3.216552734375, 3.6900634765625, 4.16357421875, 4.6370849609375, 5.110595703125, 5.5841064453125, 6.0576171875, 6.5311279296875, 7.004638671875, 7.4781494140625, 7.95166015625, 8.4251708984375, 8.898681640625, 9.3721923828125, 9.845703125, 10.3192138671875, 10.792724609375, 11.2662353515625, 11.73974609375, 12.2132568359375, 12.686767578125, 13.1602783203125, 13.6337890625, 14.1072998046875, 14.580810546875, 15.0543212890625, 15.52783203125, 16.0013427734375, 16.474853515625, 16.9483642578125, 17.421875]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 8.0, 8.0, 16.0, 29.0, 30.0, 56.0, 84.0, 125.0, 224.0, 343.0, 479.0, 799.0, 1317.0, 2047.0, 3425.0, 5521.0, 9574.0, 16255.0, 28500.0, 50813.0, 93144.0, 173349.0, 270769.0, 175473.0, 94733.0, 51388.0, 28861.0, 16646.0, 9700.0, 5720.0, 3547.0, 2072.0, 1312.0, 800.0, 498.0, 303.0, 218.0, 139.0, 73.0, 53.0, 32.0, 23.0, 22.0, 8.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.309814453125, -0.30028533935546875, -0.2907562255859375, -0.28122711181640625, -0.271697998046875, -0.26216888427734375, -0.2526397705078125, -0.24311065673828125, -0.23358154296875, -0.22405242919921875, -0.2145233154296875, -0.20499420166015625, -0.195465087890625, -0.18593597412109375, -0.1764068603515625, -0.16687774658203125, -0.1573486328125, -0.14781951904296875, -0.1382904052734375, -0.12876129150390625, -0.119232177734375, -0.10970306396484375, -0.1001739501953125, -0.09064483642578125, -0.08111572265625, -0.07158660888671875, -0.0620574951171875, -0.05252838134765625, -0.042999267578125, -0.03347015380859375, -0.0239410400390625, -0.01441192626953125, -0.0048828125, 0.00464630126953125, 0.0141754150390625, 0.02370452880859375, 0.033233642578125, 0.04276275634765625, 0.0522918701171875, 0.06182098388671875, 0.07135009765625, 0.08087921142578125, 0.0904083251953125, 0.09993743896484375, 0.109466552734375, 0.11899566650390625, 0.1285247802734375, 0.13805389404296875, 0.1475830078125, 0.15711212158203125, 0.1666412353515625, 0.17617034912109375, 0.185699462890625, 0.19522857666015625, 0.2047576904296875, 0.21428680419921875, 0.22381591796875, 0.23334503173828125, 0.2428741455078125, 0.25240325927734375, 0.261932373046875, 0.27146148681640625, 0.2809906005859375, 0.29051971435546875, 0.300048828125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 4.0, 10.0, 11.0, 10.0, 14.0, 10.0, 18.0, 22.0, 19.0, 20.0, 38.0, 37.0, 34.0, 34.0, 34.0, 34.0, 35.0, 35.0, 44.0, 1070.0, 45.0, 46.0, 44.0, 55.0, 37.0, 36.0, 24.0, 22.0, 30.0, 31.0, 13.0, 21.0, 13.0, 18.0, 18.0, 15.0, 6.0, 9.0, 3.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3046875, -7.998291015625, -7.69189453125, -7.385498046875, -7.0791015625, -6.772705078125, -6.46630859375, -6.159912109375, -5.853515625, -5.547119140625, -5.24072265625, -4.934326171875, -4.6279296875, -4.321533203125, -4.01513671875, -3.708740234375, -3.40234375, -3.095947265625, -2.78955078125, -2.483154296875, -2.1767578125, -1.870361328125, -1.56396484375, -1.257568359375, -0.951171875, -0.644775390625, -0.33837890625, -0.031982421875, 0.2744140625, 0.580810546875, 0.88720703125, 1.193603515625, 1.5, 1.806396484375, 2.11279296875, 2.419189453125, 2.7255859375, 3.031982421875, 3.33837890625, 3.644775390625, 3.951171875, 4.257568359375, 4.56396484375, 4.870361328125, 5.1767578125, 5.483154296875, 5.78955078125, 6.095947265625, 6.40234375, 6.708740234375, 7.01513671875, 7.321533203125, 7.6279296875, 7.934326171875, 8.24072265625, 8.547119140625, 8.853515625, 9.159912109375, 9.46630859375, 9.772705078125, 10.0791015625, 10.385498046875, 10.69189453125, 10.998291015625, 11.3046875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 8.0, 6.0, 16.0, 24.0, 25.0, 50.0, 64.0, 104.0, 145.0, 231.0, 342.0, 564.0, 772.0, 1160.0, 1711.0, 2705.0, 4252.0, 6413.0, 9911.0, 15485.0, 24226.0, 38638.0, 62463.0, 104673.0, 183509.0, 1280242.0, 140935.0, 81960.0, 49974.0, 31659.0, 19523.0, 12292.0, 7853.0, 5103.0, 3490.0, 2197.0, 1482.0, 947.0, 650.0, 437.0, 316.0, 180.0, 123.0, 97.0, 58.0, 44.0, 30.0, 15.0, 15.0, 4.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.149658203125, -0.14487266540527344, -0.14008712768554688, -0.1353015899658203, -0.13051605224609375, -0.1257305145263672, -0.12094497680664062, -0.11615943908691406, -0.1113739013671875, -0.10658836364746094, -0.10180282592773438, -0.09701728820800781, -0.09223175048828125, -0.08744621276855469, -0.08266067504882812, -0.07787513732910156, -0.073089599609375, -0.06830406188964844, -0.06351852416992188, -0.05873298645019531, -0.05394744873046875, -0.04916191101074219, -0.044376373291015625, -0.03959083557128906, -0.0348052978515625, -0.030019760131835938, -0.025234222412109375, -0.020448684692382812, -0.01566314697265625, -0.010877609252929688, -0.006092071533203125, -0.0013065338134765625, 0.00347900390625, 0.008264541625976562, 0.013050079345703125, 0.017835617065429688, 0.02262115478515625, 0.027406692504882812, 0.032192230224609375, 0.03697776794433594, 0.0417633056640625, 0.04654884338378906, 0.051334381103515625, 0.05611991882324219, 0.06090545654296875, 0.06569099426269531, 0.07047653198242188, 0.07526206970214844, 0.080047607421875, 0.08483314514160156, 0.08961868286132812, 0.09440422058105469, 0.09918975830078125, 0.10397529602050781, 0.10876083374023438, 0.11354637145996094, 0.1183319091796875, 0.12311744689941406, 0.12790298461914062, 0.1326885223388672, 0.13747406005859375, 0.1422595977783203, 0.14704513549804688, 0.15183067321777344, 0.1566162109375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 2.0, 7.0, 6.0, 3.0, 9.0, 4.0, 9.0, 16.0, 17.0, 22.0, 31.0, 18.0, 25.0, 29.0, 36.0, 33.0, 40.0, 51.0, 80.0, 87.0, 91.0, 63.0, 54.0, 36.0, 25.0, 37.0, 27.0, 28.0, 19.0, 21.0, 10.0, 5.0, 5.0, 5.0, 9.0, 6.0, 6.0, 7.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.00025081634521484375, -0.00024335645139217377, -0.00023589655756950378, -0.0002284366637468338, -0.00022097676992416382, -0.00021351687610149384, -0.00020605698227882385, -0.00019859708845615387, -0.0001911371946334839, -0.0001836773008108139, -0.00017621740698814392, -0.00016875751316547394, -0.00016129761934280396, -0.00015383772552013397, -0.000146377831697464, -0.000138917937874794, -0.00013145804405212402, -0.00012399815022945404, -0.00011653825640678406, -0.00010907836258411407, -0.00010161846876144409, -9.415857493877411e-05, -8.669868111610413e-05, -7.923878729343414e-05, -7.177889347076416e-05, -6.431899964809418e-05, -5.6859105825424194e-05, -4.939921200275421e-05, -4.193931818008423e-05, -3.4479424357414246e-05, -2.7019530534744263e-05, -1.955963671207428e-05, -1.2099742889404297e-05, -4.639849066734314e-06, 2.820044755935669e-06, 1.0279938578605652e-05, 1.7739832401275635e-05, 2.5199726223945618e-05, 3.26596200466156e-05, 4.0119513869285583e-05, 4.7579407691955566e-05, 5.503930151462555e-05, 6.249919533729553e-05, 6.995908915996552e-05, 7.74189829826355e-05, 8.487887680530548e-05, 9.233877062797546e-05, 9.979866445064545e-05, 0.00010725855827331543, 0.00011471845209598541, 0.0001221783459186554, 0.00012963823974132538, 0.00013709813356399536, 0.00014455802738666534, 0.00015201792120933533, 0.0001594778150320053, 0.0001669377088546753, 0.00017439760267734528, 0.00018185749650001526, 0.00018931739032268524, 0.00019677728414535522, 0.0002042371779680252, 0.0002116970717906952, 0.00021915696561336517, 0.00022661685943603516]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 5.0, 7.0, 11.0, 7.0, 11.0, 7.0, 12.0, 18.0, 28.0, 41.0, 38.0, 42.0, 96.0, 121.0, 180.0, 361.0, 854.0, 59077.0, 984710.0, 1652.0, 479.0, 230.0, 133.0, 99.0, 81.0, 39.0, 36.0, 34.0, 33.0, 24.0, 18.0, 9.0, 9.0, 9.0, 5.0, 5.0, 6.0, 5.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0054473876953125, -0.00527268648147583, -0.00509798526763916, -0.00492328405380249, -0.00474858283996582, -0.00457388162612915, -0.0043991804122924805, -0.0042244791984558105, -0.004049777984619141, -0.0038750767707824707, -0.0037003755569458008, -0.003525674343109131, -0.003350973129272461, -0.003176271915435791, -0.003001570701599121, -0.002826869487762451, -0.0026521682739257812, -0.0024774670600891113, -0.0023027658462524414, -0.0021280646324157715, -0.0019533634185791016, -0.0017786622047424316, -0.0016039609909057617, -0.0014292597770690918, -0.0012545585632324219, -0.001079857349395752, -0.000905156135559082, -0.0007304549217224121, -0.0005557537078857422, -0.00038105249404907227, -0.00020635128021240234, -3.165006637573242e-05, 0.0001430511474609375, 0.0003177523612976074, 0.0004924535751342773, 0.0006671547889709473, 0.0008418560028076172, 0.0010165572166442871, 0.001191258430480957, 0.001365959644317627, 0.0015406608581542969, 0.0017153620719909668, 0.0018900632858276367, 0.0020647644996643066, 0.0022394657135009766, 0.0024141669273376465, 0.0025888681411743164, 0.0027635693550109863, 0.0029382705688476562, 0.003112971782684326, 0.003287672996520996, 0.003462374210357666, 0.003637075424194336, 0.003811776638031006, 0.003986477851867676, 0.004161179065704346, 0.004335880279541016, 0.0045105814933776855, 0.0046852827072143555, 0.004859983921051025, 0.005034685134887695, 0.005209386348724365, 0.005384087562561035, 0.005558788776397705, 0.005733489990234375]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 762.0, 253.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008890714962035418, -0.0006648646667599678, -0.00044065777910873294, -0.00021645089145749807, 7.755937986075878e-06, 0.00023196276742964983, 0.0004561697132885456, 0.0006803765427321196, 0.0009045833721756935, 0.0011287902016192675, 0.0013529970310628414, 0.0015772039769217372, 0.0018014108063653111, 0.002025617752224207, 0.002249824581667781, 0.002474031411111355, 0.0026982382405549288, 0.0029224450699985027, 0.0031466518994420767, 0.0033708587288856506, 0.0035950657911598682, 0.0038192723877727985, 0.004043479450047016, 0.0042676860466599464, 0.004491893108934164, 0.004716100171208382, 0.004940306767821312, 0.0051645138300955296, 0.00538872042670846, 0.0056129274889826775, 0.005837134085595608, 0.006061341147869825, 0.006285548210144043, 0.006509755272418261, 0.006733961869031191, 0.0069581689313054085, 0.007182375527918339, 0.007406582590192556, 0.007630789652466774, 0.007854996249079704, 0.008079202845692635, 0.008303409442305565, 0.00852761697024107, 0.008751823566854, 0.00897603016346693, 0.00920023676007986, 0.009424444288015366, 0.009648650884628296, 0.009872857481241226, 0.010097064077854156, 0.010321271605789661, 0.010545478202402592, 0.010769684799015522, 0.010993891395628452, 0.011218098923563957, 0.011442305520176888, 0.011666513048112392, 0.011890719644725323, 0.012114927172660828, 0.012339133769273758, 0.012563340365886688, 0.012787546962499619, 0.013011754490435123, 0.013235961087048054, 0.013460167683660984]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 9.0, 8.0, 36.0, 55.0, 79.0, 122.0, 148.0, 142.0, 129.0, 116.0, 69.0, 51.0, 32.0, 13.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005792379379272461, -0.0005623642355203629, -0.0005454905331134796, -0.0005286168307065964, -0.0005117431282997131, -0.0004948694258928299, -0.00047799572348594666, -0.0004611220210790634, -0.0004442483186721802, -0.00042737461626529694, -0.0004105009138584137, -0.00039362721145153046, -0.0003767535090446472, -0.000359879806637764, -0.00034300610423088074, -0.0003261324018239975, -0.00030925869941711426, -0.000292384997010231, -0.0002755112946033478, -0.00025863759219646454, -0.0002417638897895813, -0.00022489018738269806, -0.00020801648497581482, -0.00019114278256893158, -0.00017426908016204834, -0.0001573953777551651, -0.00014052167534828186, -0.00012364797294139862, -0.00010677427053451538, -8.990056812763214e-05, -7.30268657207489e-05, -5.615316331386566e-05, -3.927946090698242e-05, -2.2405758500099182e-05, -5.532056093215942e-06, 1.1341646313667297e-05, 2.8215348720550537e-05, 4.508905112743378e-05, 6.196275353431702e-05, 7.883645594120026e-05, 9.57101583480835e-05, 0.00011258386075496674, 0.00012945756316184998, 0.00014633126556873322, 0.00016320496797561646, 0.0001800786703824997, 0.00019695237278938293, 0.00021382607519626617, 0.00023069977760314941, 0.00024757348001003265, 0.0002644471824169159, 0.00028132088482379913, 0.0002981945872306824, 0.0003150682896375656, 0.00033194199204444885, 0.0003488156944513321, 0.00036568939685821533, 0.00038256309926509857, 0.0003994368016719818, 0.00041631050407886505, 0.0004331842064857483, 0.00045005790889263153, 0.00046693161129951477, 0.000483805313706398, 0.0005006790161132812]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 3.0, 9.0, 3.0, 8.0, 10.0, 14.0, 11.0, 13.0, 21.0, 23.0, 24.0, 23.0, 31.0, 29.0, 47.0, 44.0, 47.0, 26.0, 41.0, 61.0, 45.0, 42.0, 45.0, 42.0, 30.0, 40.0, 39.0, 45.0, 28.0, 30.0, 25.0, 16.0, 18.0, 11.0, 13.0, 11.0, 9.0, 6.0, 7.0, 7.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8828125, -12.4093017578125, -11.935791015625, -11.4622802734375, -10.98876953125, -10.5152587890625, -10.041748046875, -9.5682373046875, -9.0947265625, -8.6212158203125, -8.147705078125, -7.6741943359375, -7.20068359375, -6.7271728515625, -6.253662109375, -5.7801513671875, -5.306640625, -4.8331298828125, -4.359619140625, -3.8861083984375, -3.41259765625, -2.9390869140625, -2.465576171875, -1.9920654296875, -1.5185546875, -1.0450439453125, -0.571533203125, -0.0980224609375, 0.37548828125, 0.8489990234375, 1.322509765625, 1.7960205078125, 2.26953125, 2.7430419921875, 3.216552734375, 3.6900634765625, 4.16357421875, 4.6370849609375, 5.110595703125, 5.5841064453125, 6.0576171875, 6.5311279296875, 7.004638671875, 7.4781494140625, 7.95166015625, 8.4251708984375, 8.898681640625, 9.3721923828125, 9.845703125, 10.3192138671875, 10.792724609375, 11.2662353515625, 11.73974609375, 12.2132568359375, 12.686767578125, 13.1602783203125, 13.6337890625, 14.1072998046875, 14.580810546875, 15.0543212890625, 15.52783203125, 16.0013427734375, 16.474853515625, 16.9483642578125, 17.421875]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 2.0, 4.0, 12.0, 3.0, 27.0, 24.0, 40.0, 42.0, 73.0, 108.0, 157.0, 227.0, 346.0, 516.0, 763.0, 1288.0, 2206.0, 3845.0, 7485.0, 16790.0, 50815.0, 253627.0, 555553.0, 103706.0, 27556.0, 10792.0, 5174.0, 2746.0, 1621.0, 1021.0, 640.0, 457.0, 274.0, 187.0, 133.0, 85.0, 73.0, 45.0, 30.0, 19.0, 14.0, 6.0, 10.0, 6.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.09375, -25.308837890625, -24.52392578125, -23.739013671875, -22.9541015625, -22.169189453125, -21.38427734375, -20.599365234375, -19.814453125, -19.029541015625, -18.24462890625, -17.459716796875, -16.6748046875, -15.889892578125, -15.10498046875, -14.320068359375, -13.53515625, -12.750244140625, -11.96533203125, -11.180419921875, -10.3955078125, -9.610595703125, -8.82568359375, -8.040771484375, -7.255859375, -6.470947265625, -5.68603515625, -4.901123046875, -4.1162109375, -3.331298828125, -2.54638671875, -1.761474609375, -0.9765625, -0.191650390625, 0.59326171875, 1.378173828125, 2.1630859375, 2.947998046875, 3.73291015625, 4.517822265625, 5.302734375, 6.087646484375, 6.87255859375, 7.657470703125, 8.4423828125, 9.227294921875, 10.01220703125, 10.797119140625, 11.58203125, 12.366943359375, 13.15185546875, 13.936767578125, 14.7216796875, 15.506591796875, 16.29150390625, 17.076416015625, 17.861328125, 18.646240234375, 19.43115234375, 20.216064453125, 21.0009765625, 21.785888671875, 22.57080078125, 23.355712890625, 24.140625]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 3.0, 3.0, 6.0, 6.0, 6.0, 6.0, 11.0, 8.0, 13.0, 16.0, 23.0, 15.0, 23.0, 33.0, 23.0, 40.0, 42.0, 43.0, 78.0, 71.0, 204.0, 1592.0, 278.0, 96.0, 64.0, 50.0, 41.0, 33.0, 38.0, 32.0, 37.0, 22.0, 12.0, 20.0, 12.0, 11.0, 13.0, 5.0, 4.0, 5.0, 6.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0], "bins": [-42.125, -41.035400390625, -39.94580078125, -38.856201171875, -37.7666015625, -36.677001953125, -35.58740234375, -34.497802734375, -33.408203125, -32.318603515625, -31.22900390625, -30.139404296875, -29.0498046875, -27.960205078125, -26.87060546875, -25.781005859375, -24.69140625, -23.601806640625, -22.51220703125, -21.422607421875, -20.3330078125, -19.243408203125, -18.15380859375, -17.064208984375, -15.974609375, -14.885009765625, -13.79541015625, -12.705810546875, -11.6162109375, -10.526611328125, -9.43701171875, -8.347412109375, -7.2578125, -6.168212890625, -5.07861328125, -3.989013671875, -2.8994140625, -1.809814453125, -0.72021484375, 0.369384765625, 1.458984375, 2.548583984375, 3.63818359375, 4.727783203125, 5.8173828125, 6.906982421875, 7.99658203125, 9.086181640625, 10.17578125, 11.265380859375, 12.35498046875, 13.444580078125, 14.5341796875, 15.623779296875, 16.71337890625, 17.802978515625, 18.892578125, 19.982177734375, 21.07177734375, 22.161376953125, 23.2509765625, 24.340576171875, 25.43017578125, 26.519775390625, 27.609375]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 7.0, 12.0, 12.0, 13.0, 15.0, 29.0, 36.0, 57.0, 66.0, 108.0, 147.0, 261.0, 468.0, 1336.0, 13897.0, 3086227.0, 39530.0, 2045.0, 553.0, 316.0, 168.0, 113.0, 88.0, 55.0, 38.0, 26.0, 16.0, 14.0, 16.0, 12.0, 10.0, 2.0, 6.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-100.25, -97.3544921875, -94.458984375, -91.5634765625, -88.66796875, -85.7724609375, -82.876953125, -79.9814453125, -77.0859375, -74.1904296875, -71.294921875, -68.3994140625, -65.50390625, -62.6083984375, -59.712890625, -56.8173828125, -53.921875, -51.0263671875, -48.130859375, -45.2353515625, -42.33984375, -39.4443359375, -36.548828125, -33.6533203125, -30.7578125, -27.8623046875, -24.966796875, -22.0712890625, -19.17578125, -16.2802734375, -13.384765625, -10.4892578125, -7.59375, -4.6982421875, -1.802734375, 1.0927734375, 3.98828125, 6.8837890625, 9.779296875, 12.6748046875, 15.5703125, 18.4658203125, 21.361328125, 24.2568359375, 27.15234375, 30.0478515625, 32.943359375, 35.8388671875, 38.734375, 41.6298828125, 44.525390625, 47.4208984375, 50.31640625, 53.2119140625, 56.107421875, 59.0029296875, 61.8984375, 64.7939453125, 67.689453125, 70.5849609375, 73.48046875, 76.3759765625, 79.271484375, 82.1669921875, 85.0625]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 8.0, 8.0, 33.0, 63.0, 120.0, 201.0, 241.0, 152.0, 85.0, 51.0, 19.0, 13.0, 10.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.17568969726562, -95.25472259521484, -91.33375549316406, -87.41278839111328, -83.4918212890625, -79.57085418701172, -75.64988708496094, -71.72892761230469, -67.80795288085938, -63.886985778808594, -59.96601867675781, -56.04505157470703, -52.12408447265625, -48.20311737060547, -44.28215408325195, -40.36118698120117, -36.440223693847656, -32.519256591796875, -28.598289489746094, -24.677324295043945, -20.756357192993164, -16.835390090942383, -12.914424896240234, -8.993457794189453, -5.072490692138672, -1.1515240669250488, 2.769442558288574, 6.690408706665039, 10.61137580871582, 14.532342910766602, 18.45330810546875, 22.37427520751953, 26.295242309570312, 30.216209411621094, 34.137176513671875, 38.058143615722656, 41.97911071777344, 45.90007781982422, 49.821041107177734, 53.742008209228516, 57.6629753112793, 61.58394241333008, 65.5049057006836, 69.42587280273438, 73.34683990478516, 77.26780700683594, 81.18877410888672, 85.1097412109375, 89.03070831298828, 92.95167541503906, 96.87264251708984, 100.79360961914062, 104.7145767211914, 108.63554382324219, 112.55650329589844, 116.47747802734375, 120.3984375, 124.31940460205078, 128.24037170410156, 132.1613311767578, 136.08230590820312, 140.00326538085938, 143.9242401123047, 147.84519958496094, 151.76617431640625]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 3.0, 6.0, 6.0, 7.0, 10.0, 9.0, 8.0, 10.0, 7.0, 13.0, 6.0, 24.0, 22.0, 20.0, 37.0, 43.0, 33.0, 38.0, 34.0, 33.0, 47.0, 56.0, 41.0, 48.0, 44.0, 44.0, 39.0, 48.0, 41.0, 28.0, 24.0, 30.0, 27.0, 18.0, 18.0, 15.0, 15.0, 11.0, 12.0, 8.0, 8.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-102.04652404785156, -98.91427612304688, -95.78202819824219, -92.6497802734375, -89.51753234863281, -86.38528442382812, -83.25303649902344, -80.12078094482422, -76.98853302001953, -73.85628509521484, -70.72403717041016, -67.59178924560547, -64.45954132080078, -61.32728958129883, -58.19504165649414, -55.06278991699219, -51.930545806884766, -48.79829788208008, -45.66604995727539, -42.53379821777344, -39.40155029296875, -36.26930236816406, -33.137054443359375, -30.004804611206055, -26.872556686401367, -23.74030876159668, -20.60805892944336, -17.475811004638672, -14.343562126159668, -11.211313247680664, -8.079065322875977, -4.946815490722656, -1.8145675659179688, 1.317681074142456, 4.449929714202881, 7.582178115844727, 10.71442699432373, 13.846675872802734, 16.978923797607422, 20.111173629760742, 23.24342155456543, 26.375669479370117, 29.507919311523438, 32.640167236328125, 35.77241516113281, 38.9046630859375, 42.03691101074219, 45.16916275024414, 48.30141067504883, 51.433658599853516, 54.5659065246582, 57.698158264160156, 60.830406188964844, 63.96265411376953, 67.09490203857422, 70.2271499633789, 73.3593978881836, 76.49164581298828, 79.62389373779297, 82.75614166259766, 85.88838958740234, 89.02064514160156, 92.15289306640625, 95.28514099121094, 98.41738891601562]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 4.0, 3.0, 7.0, 2.0, 14.0, 11.0, 11.0, 24.0, 29.0, 23.0, 23.0, 23.0, 41.0, 31.0, 38.0, 39.0, 35.0, 42.0, 61.0, 34.0, 46.0, 57.0, 51.0, 40.0, 39.0, 45.0, 34.0, 37.0, 29.0, 16.0, 27.0, 19.0, 17.0, 7.0, 9.0, 7.0, 4.0, 12.0, 6.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.7890625, -14.2735595703125, -13.758056640625, -13.2425537109375, -12.72705078125, -12.2115478515625, -11.696044921875, -11.1805419921875, -10.6650390625, -10.1495361328125, -9.634033203125, -9.1185302734375, -8.60302734375, -8.0875244140625, -7.572021484375, -7.0565185546875, -6.541015625, -6.0255126953125, -5.510009765625, -4.9945068359375, -4.47900390625, -3.9635009765625, -3.447998046875, -2.9324951171875, -2.4169921875, -1.9014892578125, -1.385986328125, -0.8704833984375, -0.35498046875, 0.1605224609375, 0.676025390625, 1.1915283203125, 1.70703125, 2.2225341796875, 2.738037109375, 3.2535400390625, 3.76904296875, 4.2845458984375, 4.800048828125, 5.3155517578125, 5.8310546875, 6.3465576171875, 6.862060546875, 7.3775634765625, 7.89306640625, 8.4085693359375, 8.924072265625, 9.4395751953125, 9.955078125, 10.4705810546875, 10.986083984375, 11.5015869140625, 12.01708984375, 12.5325927734375, 13.048095703125, 13.5635986328125, 14.0791015625, 14.5946044921875, 15.110107421875, 15.6256103515625, 16.14111328125, 16.6566162109375, 17.172119140625, 17.6876220703125, 18.203125]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 6.0, 8.0, 5.0, 9.0, 15.0, 31.0, 21.0, 46.0, 68.0, 83.0, 107.0, 141.0, 226.0, 314.0, 407.0, 634.0, 917.0, 1403.0, 2312.0, 4623.0, 14202.0, 134669.0, 1975508.0, 1892413.0, 140661.0, 14063.0, 4569.0, 2373.0, 1411.0, 961.0, 622.0, 435.0, 321.0, 217.0, 134.0, 105.0, 75.0, 39.0, 44.0, 24.0, 23.0, 16.0, 8.0, 7.0, 7.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-35.53125, -34.544189453125, -33.55712890625, -32.570068359375, -31.5830078125, -30.595947265625, -29.60888671875, -28.621826171875, -27.634765625, -26.647705078125, -25.66064453125, -24.673583984375, -23.6865234375, -22.699462890625, -21.71240234375, -20.725341796875, -19.73828125, -18.751220703125, -17.76416015625, -16.777099609375, -15.7900390625, -14.802978515625, -13.81591796875, -12.828857421875, -11.841796875, -10.854736328125, -9.86767578125, -8.880615234375, -7.8935546875, -6.906494140625, -5.91943359375, -4.932373046875, -3.9453125, -2.958251953125, -1.97119140625, -0.984130859375, 0.0029296875, 0.989990234375, 1.97705078125, 2.964111328125, 3.951171875, 4.938232421875, 5.92529296875, 6.912353515625, 7.8994140625, 8.886474609375, 9.87353515625, 10.860595703125, 11.84765625, 12.834716796875, 13.82177734375, 14.808837890625, 15.7958984375, 16.782958984375, 17.77001953125, 18.757080078125, 19.744140625, 20.731201171875, 21.71826171875, 22.705322265625, 23.6923828125, 24.679443359375, 25.66650390625, 26.653564453125, 27.640625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 4.0, 5.0, 3.0, 12.0, 14.0, 27.0, 29.0, 52.0, 92.0, 102.0, 197.0, 311.0, 586.0, 864.0, 771.0, 417.0, 226.0, 140.0, 77.0, 46.0, 35.0, 22.0, 24.0, 8.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.828125, -22.825927734375, -21.82373046875, -20.821533203125, -19.8193359375, -18.817138671875, -17.81494140625, -16.812744140625, -15.810546875, -14.808349609375, -13.80615234375, -12.803955078125, -11.8017578125, -10.799560546875, -9.79736328125, -8.795166015625, -7.79296875, -6.790771484375, -5.78857421875, -4.786376953125, -3.7841796875, -2.781982421875, -1.77978515625, -0.777587890625, 0.224609375, 1.226806640625, 2.22900390625, 3.231201171875, 4.2333984375, 5.235595703125, 6.23779296875, 7.239990234375, 8.2421875, 9.244384765625, 10.24658203125, 11.248779296875, 12.2509765625, 13.253173828125, 14.25537109375, 15.257568359375, 16.259765625, 17.261962890625, 18.26416015625, 19.266357421875, 20.2685546875, 21.270751953125, 22.27294921875, 23.275146484375, 24.27734375, 25.279541015625, 26.28173828125, 27.283935546875, 28.2861328125, 29.288330078125, 30.29052734375, 31.292724609375, 32.294921875, 33.297119140625, 34.29931640625, 35.301513671875, 36.3037109375, 37.305908203125, 38.30810546875, 39.310302734375, 40.3125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 7.0, 6.0, 24.0, 29.0, 42.0, 65.0, 136.0, 271.0, 754.0, 3018.0, 25459.0, 2422307.0, 1715122.0, 22746.0, 2814.0, 803.0, 314.0, 150.0, 80.0, 47.0, 32.0, 21.0, 8.0, 13.0, 10.0, 3.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-78.3125, -76.4013671875, -74.490234375, -72.5791015625, -70.66796875, -68.7568359375, -66.845703125, -64.9345703125, -63.0234375, -61.1123046875, -59.201171875, -57.2900390625, -55.37890625, -53.4677734375, -51.556640625, -49.6455078125, -47.734375, -45.8232421875, -43.912109375, -42.0009765625, -40.08984375, -38.1787109375, -36.267578125, -34.3564453125, -32.4453125, -30.5341796875, -28.623046875, -26.7119140625, -24.80078125, -22.8896484375, -20.978515625, -19.0673828125, -17.15625, -15.2451171875, -13.333984375, -11.4228515625, -9.51171875, -7.6005859375, -5.689453125, -3.7783203125, -1.8671875, 0.0439453125, 1.955078125, 3.8662109375, 5.77734375, 7.6884765625, 9.599609375, 11.5107421875, 13.421875, 15.3330078125, 17.244140625, 19.1552734375, 21.06640625, 22.9775390625, 24.888671875, 26.7998046875, 28.7109375, 30.6220703125, 32.533203125, 34.4443359375, 36.35546875, 38.2666015625, 40.177734375, 42.0888671875, 44.0]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 13.0, 109.0, 420.0, 402.0, 61.0, 7.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-218.65985107421875, -206.4739227294922, -194.28799438476562, -182.10208129882812, -169.91615295410156, -157.730224609375, -145.5443115234375, -133.35838317871094, -121.17245483398438, -108.98652648925781, -96.80060577392578, -84.61468505859375, -72.42875671386719, -60.24283218383789, -48.056907653808594, -35.87098693847656, -23.68505859375, -11.499134063720703, 0.6867904663085938, 12.87271499633789, 25.058639526367188, 37.244564056396484, 49.43048858642578, 61.61640930175781, 73.80233764648438, 85.98826599121094, 98.17418670654297, 110.360107421875, 122.54603576660156, 134.73196411132812, 146.91787719726562, 159.1038055419922, 171.28973388671875, 183.4756622314453, 195.66159057617188, 207.84750366210938, 220.03343200683594, 232.2193603515625, 244.4052734375, 256.5911865234375, 268.7771301269531, 280.9630432128906, 293.14898681640625, 305.33489990234375, 317.52081298828125, 329.7067565917969, 341.8926696777344, 354.07861328125, 366.2645263671875, 378.450439453125, 390.6363830566406, 402.8222961425781, 415.00823974609375, 427.19415283203125, 439.38006591796875, 451.56597900390625, 463.7519226074219, 475.9378356933594, 488.123779296875, 500.3096923828125, 512.49560546875, 524.6815185546875, 536.8674926757812, 549.0534057617188, 561.2393188476562]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 4.0, 5.0, 6.0, 7.0, 7.0, 12.0, 16.0, 8.0, 23.0, 20.0, 26.0, 15.0, 32.0, 29.0, 40.0, 35.0, 43.0, 44.0, 35.0, 38.0, 39.0, 46.0, 44.0, 42.0, 46.0, 46.0, 37.0, 32.0, 34.0, 33.0, 23.0, 23.0, 16.0, 8.0, 13.0, 15.0, 9.0, 14.0, 10.0, 7.0, 3.0, 5.0, 5.0, 3.0, 1.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-80.37522888183594, -77.98039245605469, -75.58555603027344, -73.19071960449219, -70.79588317871094, -68.40104675292969, -66.00621032714844, -63.61137008666992, -61.21653366088867, -58.82169723510742, -56.42686080932617, -54.03202438354492, -51.637184143066406, -49.242347717285156, -46.847511291503906, -44.452674865722656, -42.057838439941406, -39.663002014160156, -37.268165588378906, -34.873329162597656, -32.478492736816406, -30.083654403686523, -27.68881607055664, -25.29397964477539, -22.89914321899414, -20.50430679321289, -18.10947036743164, -15.714632034301758, -13.319795608520508, -10.924959182739258, -8.530121803283691, -6.135284423828125, -3.740447998046875, -1.3456110954284668, 1.0492258071899414, 3.4440627098083496, 5.838899612426758, 8.233736038208008, 10.628573417663574, 13.02341079711914, 15.41824722290039, 17.81308364868164, 20.20792007446289, 22.602758407592773, 24.997594833374023, 27.392431259155273, 29.787269592285156, 32.182106018066406, 34.576942443847656, 36.971778869628906, 39.366615295410156, 41.761451721191406, 44.156288146972656, 46.551124572753906, 48.94596481323242, 51.34080123901367, 53.73563766479492, 56.13047409057617, 58.52531051635742, 60.92014694213867, 63.31498718261719, 65.70982360839844, 68.10466003417969, 70.49949645996094, 72.89433288574219]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 6.0, 8.0, 4.0, 6.0, 10.0, 18.0, 11.0, 12.0, 13.0, 21.0, 25.0, 13.0, 32.0, 26.0, 37.0, 49.0, 45.0, 42.0, 44.0, 36.0, 50.0, 41.0, 34.0, 53.0, 53.0, 43.0, 51.0, 25.0, 37.0, 22.0, 21.0, 25.0, 23.0, 9.0, 18.0, 13.0, 10.0, 8.0, 5.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.5625, -12.1400146484375, -11.717529296875, -11.2950439453125, -10.87255859375, -10.4500732421875, -10.027587890625, -9.6051025390625, -9.1826171875, -8.7601318359375, -8.337646484375, -7.9151611328125, -7.49267578125, -7.0701904296875, -6.647705078125, -6.2252197265625, -5.802734375, -5.3802490234375, -4.957763671875, -4.5352783203125, -4.11279296875, -3.6903076171875, -3.267822265625, -2.8453369140625, -2.4228515625, -2.0003662109375, -1.577880859375, -1.1553955078125, -0.73291015625, -0.3104248046875, 0.112060546875, 0.5345458984375, 0.95703125, 1.3795166015625, 1.802001953125, 2.2244873046875, 2.64697265625, 3.0694580078125, 3.491943359375, 3.9144287109375, 4.3369140625, 4.7593994140625, 5.181884765625, 5.6043701171875, 6.02685546875, 6.4493408203125, 6.871826171875, 7.2943115234375, 7.716796875, 8.1392822265625, 8.561767578125, 8.9842529296875, 9.40673828125, 9.8292236328125, 10.251708984375, 10.6741943359375, 11.0966796875, 11.5191650390625, 11.941650390625, 12.3641357421875, 12.78662109375, 13.2091064453125, 13.631591796875, 14.0540771484375, 14.4765625]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 5.0, 4.0, 1.0, 11.0, 14.0, 18.0, 28.0, 33.0, 67.0, 93.0, 124.0, 225.0, 296.0, 469.0, 732.0, 1040.0, 1721.0, 2670.0, 4078.0, 6698.0, 10578.0, 17010.0, 26867.0, 44593.0, 73476.0, 124750.0, 223719.0, 211548.0, 117223.0, 69563.0, 41593.0, 25664.0, 16172.0, 10011.0, 6222.0, 3993.0, 2496.0, 1600.0, 1077.0, 708.0, 461.0, 297.0, 221.0, 130.0, 84.0, 51.0, 56.0, 22.0, 17.0, 14.0, 9.0, 6.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2110595703125, -0.2042388916015625, -0.197418212890625, -0.1905975341796875, -0.18377685546875, -0.1769561767578125, -0.170135498046875, -0.1633148193359375, -0.156494140625, -0.1496734619140625, -0.142852783203125, -0.1360321044921875, -0.12921142578125, -0.1223907470703125, -0.115570068359375, -0.1087493896484375, -0.1019287109375, -0.0951080322265625, -0.088287353515625, -0.0814666748046875, -0.07464599609375, -0.0678253173828125, -0.061004638671875, -0.0541839599609375, -0.04736328125, -0.0405426025390625, -0.033721923828125, -0.0269012451171875, -0.02008056640625, -0.0132598876953125, -0.006439208984375, 0.0003814697265625, 0.0072021484375, 0.0140228271484375, 0.020843505859375, 0.0276641845703125, 0.03448486328125, 0.0413055419921875, 0.048126220703125, 0.0549468994140625, 0.061767578125, 0.0685882568359375, 0.075408935546875, 0.0822296142578125, 0.08905029296875, 0.0958709716796875, 0.102691650390625, 0.1095123291015625, 0.1163330078125, 0.1231536865234375, 0.129974365234375, 0.1367950439453125, 0.14361572265625, 0.1504364013671875, 0.157257080078125, 0.1640777587890625, 0.1708984375, 0.1777191162109375, 0.184539794921875, 0.1913604736328125, 0.19818115234375, 0.2050018310546875, 0.211822509765625, 0.2186431884765625, 0.2254638671875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 3.0, 6.0, 9.0, 17.0, 15.0, 14.0, 22.0, 27.0, 23.0, 23.0, 31.0, 34.0, 35.0, 38.0, 43.0, 52.0, 41.0, 47.0, 1072.0, 44.0, 39.0, 42.0, 36.0, 33.0, 35.0, 31.0, 28.0, 27.0, 30.0, 22.0, 10.0, 20.0, 12.0, 21.0, 10.0, 3.0, 9.0, 8.0, 7.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.671875, -8.3912353515625, -8.110595703125, -7.8299560546875, -7.54931640625, -7.2686767578125, -6.988037109375, -6.7073974609375, -6.4267578125, -6.1461181640625, -5.865478515625, -5.5848388671875, -5.30419921875, -5.0235595703125, -4.742919921875, -4.4622802734375, -4.181640625, -3.9010009765625, -3.620361328125, -3.3397216796875, -3.05908203125, -2.7784423828125, -2.497802734375, -2.2171630859375, -1.9365234375, -1.6558837890625, -1.375244140625, -1.0946044921875, -0.81396484375, -0.5333251953125, -0.252685546875, 0.0279541015625, 0.30859375, 0.5892333984375, 0.869873046875, 1.1505126953125, 1.43115234375, 1.7117919921875, 1.992431640625, 2.2730712890625, 2.5537109375, 2.8343505859375, 3.114990234375, 3.3956298828125, 3.67626953125, 3.9569091796875, 4.237548828125, 4.5181884765625, 4.798828125, 5.0794677734375, 5.360107421875, 5.6407470703125, 5.92138671875, 6.2020263671875, 6.482666015625, 6.7633056640625, 7.0439453125, 7.3245849609375, 7.605224609375, 7.8858642578125, 8.16650390625, 8.4471435546875, 8.727783203125, 9.0084228515625, 9.2890625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 4.0, 8.0, 6.0, 7.0, 14.0, 25.0, 40.0, 46.0, 75.0, 107.0, 155.0, 228.0, 364.0, 508.0, 776.0, 1308.0, 1840.0, 2731.0, 4153.0, 6305.0, 9780.0, 15446.0, 24691.0, 40232.0, 65637.0, 112469.0, 201314.0, 1277942.0, 131531.0, 75656.0, 45967.0, 28421.0, 17429.0, 11158.0, 7146.0, 4595.0, 3034.0, 2013.0, 1256.0, 851.0, 585.0, 443.0, 310.0, 211.0, 97.0, 68.0, 48.0, 35.0, 25.0, 21.0, 14.0, 8.0, 3.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.13818359375, -0.1337451934814453, -0.12930679321289062, -0.12486839294433594, -0.12042999267578125, -0.11599159240722656, -0.11155319213867188, -0.10711479187011719, -0.1026763916015625, -0.09823799133300781, -0.09379959106445312, -0.08936119079589844, -0.08492279052734375, -0.08048439025878906, -0.07604598999023438, -0.07160758972167969, -0.067169189453125, -0.06273078918457031, -0.058292388916015625, -0.05385398864746094, -0.04941558837890625, -0.04497718811035156, -0.040538787841796875, -0.03610038757324219, -0.0316619873046875, -0.027223587036132812, -0.022785186767578125, -0.018346786499023438, -0.01390838623046875, -0.009469985961914062, -0.005031585693359375, -0.0005931854248046875, 0.00384521484375, 0.008283615112304688, 0.012722015380859375, 0.017160415649414062, 0.02159881591796875, 0.026037216186523438, 0.030475616455078125, 0.03491401672363281, 0.0393524169921875, 0.04379081726074219, 0.048229217529296875, 0.05266761779785156, 0.05710601806640625, 0.06154441833496094, 0.06598281860351562, 0.07042121887207031, 0.074859619140625, 0.07929801940917969, 0.08373641967773438, 0.08817481994628906, 0.09261322021484375, 0.09705162048339844, 0.10149002075195312, 0.10592842102050781, 0.1103668212890625, 0.11480522155761719, 0.11924362182617188, 0.12368202209472656, 0.12812042236328125, 0.13255882263183594, 0.13699722290039062, 0.1414356231689453, 0.1458740234375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 5.0, 9.0, 6.0, 5.0, 12.0, 5.0, 17.0, 16.0, 19.0, 24.0, 31.0, 33.0, 49.0, 42.0, 66.0, 62.0, 70.0, 86.0, 63.0, 46.0, 55.0, 39.0, 50.0, 41.0, 21.0, 22.0, 24.0, 27.0, 13.0, 4.0, 4.0, 9.0, 6.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0001347064971923828, -0.0001301206648349762, -0.00012553483247756958, -0.00012094900012016296, -0.00011636316776275635, -0.00011177733540534973, -0.00010719150304794312, -0.0001026056706905365, -9.801983833312988e-05, -9.343400597572327e-05, -8.884817361831665e-05, -8.426234126091003e-05, -7.967650890350342e-05, -7.50906765460968e-05, -7.050484418869019e-05, -6.591901183128357e-05, -6.133317947387695e-05, -5.674734711647034e-05, -5.216151475906372e-05, -4.7575682401657104e-05, -4.298985004425049e-05, -3.840401768684387e-05, -3.3818185329437256e-05, -2.923235297203064e-05, -2.4646520614624023e-05, -2.0060688257217407e-05, -1.547485589981079e-05, -1.0889023542404175e-05, -6.303191184997559e-06, -1.7173588275909424e-06, 2.868473529815674e-06, 7.45430588722229e-06, 1.2040138244628906e-05, 1.6625970602035522e-05, 2.121180295944214e-05, 2.5797635316848755e-05, 3.038346767425537e-05, 3.496930003166199e-05, 3.9555132389068604e-05, 4.414096474647522e-05, 4.8726797103881836e-05, 5.331262946128845e-05, 5.789846181869507e-05, 6.248429417610168e-05, 6.70701265335083e-05, 7.165595889091492e-05, 7.624179124832153e-05, 8.082762360572815e-05, 8.541345596313477e-05, 8.999928832054138e-05, 9.4585120677948e-05, 9.917095303535461e-05, 0.00010375678539276123, 0.00010834261775016785, 0.00011292845010757446, 0.00011751428246498108, 0.0001221001148223877, 0.0001266859471797943, 0.00013127177953720093, 0.00013585761189460754, 0.00014044344425201416, 0.00014502927660942078, 0.0001496151089668274, 0.000154200941324234, 0.00015878677368164062]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 4.0, 6.0, 3.0, 6.0, 7.0, 11.0, 6.0, 12.0, 21.0, 39.0, 27.0, 40.0, 72.0, 104.0, 139.0, 233.0, 446.0, 1320.0, 152831.0, 889387.0, 2443.0, 537.0, 282.0, 170.0, 113.0, 76.0, 43.0, 39.0, 32.0, 24.0, 13.0, 12.0, 10.0, 10.0, 8.0, 10.0, 5.0, 3.0, 2.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0034618377685546875, -0.003360360860824585, -0.0032588839530944824, -0.00315740704536438, -0.0030559301376342773, -0.002954453229904175, -0.0028529763221740723, -0.0027514994144439697, -0.002650022506713867, -0.0025485455989837646, -0.002447068691253662, -0.0023455917835235596, -0.002244114875793457, -0.0021426379680633545, -0.002041161060333252, -0.0019396841526031494, -0.0018382072448730469, -0.0017367303371429443, -0.0016352534294128418, -0.0015337765216827393, -0.0014322996139526367, -0.0013308227062225342, -0.0012293457984924316, -0.001127868890762329, -0.0010263919830322266, -0.000924915075302124, -0.0008234381675720215, -0.0007219612598419189, -0.0006204843521118164, -0.0005190074443817139, -0.00041753053665161133, -0.0003160536289215088, -0.00021457672119140625, -0.00011309981346130371, -1.1622905731201172e-05, 8.985400199890137e-05, 0.0001913309097290039, 0.00029280781745910645, 0.000394284725189209, 0.0004957616329193115, 0.0005972385406494141, 0.0006987154483795166, 0.0008001923561096191, 0.0009016692638397217, 0.0010031461715698242, 0.0011046230792999268, 0.0012060999870300293, 0.0013075768947601318, 0.0014090538024902344, 0.001510530710220337, 0.0016120076179504395, 0.001713484525680542, 0.0018149614334106445, 0.001916438341140747, 0.0020179152488708496, 0.002119392156600952, 0.0022208690643310547, 0.0023223459720611572, 0.0024238228797912598, 0.0025252997875213623, 0.002626776695251465, 0.0027282536029815674, 0.00282973051071167, 0.0029312074184417725, 0.003032684326171875]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 106.0, 909.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00045334320748224854, -0.0003064321062993258, -0.0001595210051164031, -1.2609903933480382e-05, 0.00013430119724944234, 0.0002812123275361955, 0.0004281233996152878, 0.00057503447169438, 0.0007219456019811332, 0.0008688566740602255, 0.0010157678043469787, 0.0011626789346337318, 0.0013095899485051632, 0.0014565011952072382, 0.0016034122090786695, 0.001750323222950101, 0.001897234469652176, 0.0020441454835236073, 0.0021910567302256823, 0.0023379677440971136, 0.0024848789907991886, 0.00263179000467062, 0.0027787010185420513, 0.0029256120324134827, 0.0030725232791155577, 0.003219434292986989, 0.003366345539689064, 0.0035132565535604954, 0.0036601675674319267, 0.0038070788141340017, 0.003953990060836077, 0.004100901074707508, 0.004247811622917652, 0.0043947226367890835, 0.004541633650660515, 0.0046885451301932335, 0.004835456144064665, 0.004982367157936096, 0.0051292781718075275, 0.005276189185678959, 0.0054231006652116776, 0.005570011679083109, 0.00571692269295454, 0.005863834172487259, 0.00601074518635869, 0.006157656200230122, 0.006304567214101553, 0.006451478227972984, 0.006598389241844416, 0.006745300255715847, 0.006892211269587278, 0.007039122749119997, 0.007186033762991428, 0.00733294477686286, 0.007479855790734291, 0.007626766804605722, 0.007773677818477154, 0.007920589298009872, 0.008067499846220016, 0.008214411325752735, 0.00836132187396288, 0.008508233353495598, 0.008655144833028316, 0.00880205538123846, 0.00894896686077118]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 17.0, 21.0, 56.0, 89.0, 147.0, 174.0, 178.0, 133.0, 100.0, 51.0, 24.0, 17.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00040650367736816406, -0.0003951890394091606, -0.00038387440145015717, -0.0003725597634911537, -0.00036124512553215027, -0.0003499304875731468, -0.00033861584961414337, -0.0003273012116551399, -0.0003159865736961365, -0.000304671935737133, -0.0002933572977781296, -0.00028204265981912613, -0.0002707280218601227, -0.00025941338390111923, -0.0002480987459421158, -0.00023678410798311234, -0.0002254694700241089, -0.00021415483206510544, -0.000202840194106102, -0.00019152555614709854, -0.0001802109181880951, -0.00016889628022909164, -0.0001575816422700882, -0.00014626700431108475, -0.0001349523663520813, -0.00012363772839307785, -0.0001123230904340744, -0.00010100845247507095, -8.96938145160675e-05, -7.837917655706406e-05, -6.706453859806061e-05, -5.574990063905716e-05, -4.443526268005371e-05, -3.312062472105026e-05, -2.1805986762046814e-05, -1.0491348803043365e-05, 8.23289155960083e-07, 1.2137927114963531e-05, 2.345256507396698e-05, 3.476720303297043e-05, 4.608184099197388e-05, 5.7396478950977325e-05, 6.871111690998077e-05, 8.002575486898422e-05, 9.134039282798767e-05, 0.00010265503078699112, 0.00011396966874599457, 0.00012528430670499802, 0.00013659894466400146, 0.0001479135826230049, 0.00015922822058200836, 0.0001705428585410118, 0.00018185749650001526, 0.0001931721344590187, 0.00020448677241802216, 0.0002158014103770256, 0.00022711604833602905, 0.0002384306862950325, 0.00024974532425403595, 0.0002610599622130394, 0.00027237460017204285, 0.0002836892381310463, 0.00029500387609004974, 0.0003063185140490532, 0.00031763315200805664]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 6.0, 8.0, 4.0, 6.0, 10.0, 18.0, 11.0, 12.0, 13.0, 21.0, 25.0, 13.0, 32.0, 26.0, 37.0, 49.0, 45.0, 42.0, 44.0, 36.0, 50.0, 41.0, 34.0, 53.0, 53.0, 43.0, 51.0, 25.0, 37.0, 22.0, 21.0, 25.0, 23.0, 9.0, 18.0, 13.0, 10.0, 8.0, 5.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.5625, -12.1400146484375, -11.717529296875, -11.2950439453125, -10.87255859375, -10.4500732421875, -10.027587890625, -9.6051025390625, -9.1826171875, -8.7601318359375, -8.337646484375, -7.9151611328125, -7.49267578125, -7.0701904296875, -6.647705078125, -6.2252197265625, -5.802734375, -5.3802490234375, -4.957763671875, -4.5352783203125, -4.11279296875, -3.6903076171875, -3.267822265625, -2.8453369140625, -2.4228515625, -2.0003662109375, -1.577880859375, -1.1553955078125, -0.73291015625, -0.3104248046875, 0.112060546875, 0.5345458984375, 0.95703125, 1.3795166015625, 1.802001953125, 2.2244873046875, 2.64697265625, 3.0694580078125, 3.491943359375, 3.9144287109375, 4.3369140625, 4.7593994140625, 5.181884765625, 5.6043701171875, 6.02685546875, 6.4493408203125, 6.871826171875, 7.2943115234375, 7.716796875, 8.1392822265625, 8.561767578125, 8.9842529296875, 9.40673828125, 9.8292236328125, 10.251708984375, 10.6741943359375, 11.0966796875, 11.5191650390625, 11.941650390625, 12.3641357421875, 12.78662109375, 13.2091064453125, 13.631591796875, 14.0540771484375, 14.4765625]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 16.0, 13.0, 12.0, 29.0, 30.0, 42.0, 55.0, 84.0, 132.0, 187.0, 338.0, 606.0, 1086.0, 2269.0, 5365.0, 16682.0, 92460.0, 696774.0, 192545.0, 26369.0, 7386.0, 2857.0, 1376.0, 731.0, 425.0, 228.0, 137.0, 97.0, 64.0, 46.0, 33.0, 18.0, 22.0, 11.0, 9.0, 7.0, 3.0, 6.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.265625, -21.539306640625, -20.81298828125, -20.086669921875, -19.3603515625, -18.634033203125, -17.90771484375, -17.181396484375, -16.455078125, -15.728759765625, -15.00244140625, -14.276123046875, -13.5498046875, -12.823486328125, -12.09716796875, -11.370849609375, -10.64453125, -9.918212890625, -9.19189453125, -8.465576171875, -7.7392578125, -7.012939453125, -6.28662109375, -5.560302734375, -4.833984375, -4.107666015625, -3.38134765625, -2.655029296875, -1.9287109375, -1.202392578125, -0.47607421875, 0.250244140625, 0.9765625, 1.702880859375, 2.42919921875, 3.155517578125, 3.8818359375, 4.608154296875, 5.33447265625, 6.060791015625, 6.787109375, 7.513427734375, 8.23974609375, 8.966064453125, 9.6923828125, 10.418701171875, 11.14501953125, 11.871337890625, 12.59765625, 13.323974609375, 14.05029296875, 14.776611328125, 15.5029296875, 16.229248046875, 16.95556640625, 17.681884765625, 18.408203125, 19.134521484375, 19.86083984375, 20.587158203125, 21.3134765625, 22.039794921875, 22.76611328125, 23.492431640625, 24.21875]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 7.0, 1.0, 9.0, 14.0, 12.0, 15.0, 26.0, 19.0, 30.0, 18.0, 30.0, 42.0, 51.0, 75.0, 88.0, 185.0, 1560.0, 322.0, 120.0, 81.0, 53.0, 51.0, 43.0, 28.0, 29.0, 18.0, 23.0, 17.0, 17.0, 14.0, 20.0, 6.0, 5.0, 4.0, 7.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.125, -29.146484375, -28.16796875, -27.189453125, -26.2109375, -25.232421875, -24.25390625, -23.275390625, -22.296875, -21.318359375, -20.33984375, -19.361328125, -18.3828125, -17.404296875, -16.42578125, -15.447265625, -14.46875, -13.490234375, -12.51171875, -11.533203125, -10.5546875, -9.576171875, -8.59765625, -7.619140625, -6.640625, -5.662109375, -4.68359375, -3.705078125, -2.7265625, -1.748046875, -0.76953125, 0.208984375, 1.1875, 2.166015625, 3.14453125, 4.123046875, 5.1015625, 6.080078125, 7.05859375, 8.037109375, 9.015625, 9.994140625, 10.97265625, 11.951171875, 12.9296875, 13.908203125, 14.88671875, 15.865234375, 16.84375, 17.822265625, 18.80078125, 19.779296875, 20.7578125, 21.736328125, 22.71484375, 23.693359375, 24.671875, 25.650390625, 26.62890625, 27.607421875, 28.5859375, 29.564453125, 30.54296875, 31.521484375, 32.5]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 5.0, 7.0, 10.0, 7.0, 21.0, 18.0, 25.0, 25.0, 27.0, 46.0, 75.0, 134.0, 245.0, 470.0, 1249.0, 62772.0, 3076171.0, 2940.0, 695.0, 309.0, 157.0, 81.0, 56.0, 39.0, 31.0, 28.0, 19.0, 12.0, 6.0, 5.0, 7.0, 5.0, 4.0, 0.0, 3.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.9375, -83.3505859375, -80.763671875, -78.1767578125, -75.58984375, -73.0029296875, -70.416015625, -67.8291015625, -65.2421875, -62.6552734375, -60.068359375, -57.4814453125, -54.89453125, -52.3076171875, -49.720703125, -47.1337890625, -44.546875, -41.9599609375, -39.373046875, -36.7861328125, -34.19921875, -31.6123046875, -29.025390625, -26.4384765625, -23.8515625, -21.2646484375, -18.677734375, -16.0908203125, -13.50390625, -10.9169921875, -8.330078125, -5.7431640625, -3.15625, -0.5693359375, 2.017578125, 4.6044921875, 7.19140625, 9.7783203125, 12.365234375, 14.9521484375, 17.5390625, 20.1259765625, 22.712890625, 25.2998046875, 27.88671875, 30.4736328125, 33.060546875, 35.6474609375, 38.234375, 40.8212890625, 43.408203125, 45.9951171875, 48.58203125, 51.1689453125, 53.755859375, 56.3427734375, 58.9296875, 61.5166015625, 64.103515625, 66.6904296875, 69.27734375, 71.8642578125, 74.451171875, 77.0380859375, 79.625]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 9.0, 198.0, 711.0, 88.0, 7.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.34883117675781, -27.304141998291016, -19.259450912475586, -11.214759826660156, -3.1700706481933594, 4.8746185302734375, 12.9193115234375, 20.964000701904297, 29.008689880371094, 37.05337905883789, 45.09806823730469, 53.14276123046875, 61.18745040893555, 69.23213958740234, 77.2768325805664, 85.32151794433594, 93.3662109375, 101.41090393066406, 109.4555892944336, 117.50028228759766, 125.54496765136719, 133.58966064453125, 141.6343536376953, 149.67904663085938, 157.72372436523438, 165.76841735839844, 173.8131103515625, 181.8577880859375, 189.90248107910156, 197.94717407226562, 205.9918670654297, 214.03656005859375, 222.08126831054688, 230.12596130371094, 238.170654296875, 246.21533203125, 254.26002502441406, 262.3047180175781, 270.34942626953125, 278.39410400390625, 286.43878173828125, 294.48345947265625, 302.5281677246094, 310.5728454589844, 318.6175537109375, 326.6622314453125, 334.7069091796875, 342.7516174316406, 350.79632568359375, 358.84100341796875, 366.8857116699219, 374.9303894042969, 382.97509765625, 391.019775390625, 399.064453125, 407.1091613769531, 415.1538391113281, 423.1985168457031, 431.24322509765625, 439.28790283203125, 447.3326110839844, 455.3772888183594, 463.4219970703125, 471.4666748046875, 479.5113525390625]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 3.0, 5.0, 7.0, 11.0, 14.0, 11.0, 19.0, 26.0, 19.0, 28.0, 27.0, 31.0, 30.0, 37.0, 44.0, 34.0, 44.0, 45.0, 48.0, 46.0, 42.0, 39.0, 37.0, 38.0, 46.0, 23.0, 42.0, 42.0, 25.0, 26.0, 22.0, 24.0, 12.0, 17.0, 9.0, 7.0, 4.0, 5.0, 2.0, 7.0, 1.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-81.09115600585938, -78.91677856445312, -76.74239349365234, -74.5680160522461, -72.39363098144531, -70.21925354003906, -68.04486846923828, -65.87049102783203, -63.69610595703125, -61.521724700927734, -59.34734344482422, -57.1729621887207, -54.99858093261719, -52.82419967651367, -50.649818420410156, -48.475440979003906, -46.30105972290039, -44.126678466796875, -41.95229721069336, -39.777915954589844, -37.60353469848633, -35.42915344238281, -33.25477600097656, -31.080392837524414, -28.9060115814209, -26.731630325317383, -24.557249069213867, -22.382869720458984, -20.20848846435547, -18.034107208251953, -15.859725952148438, -13.685344696044922, -11.510963439941406, -9.33658218383789, -7.162201404571533, -4.987820625305176, -2.81343936920166, -0.6390581130981445, 1.5353221893310547, 3.7097034454345703, 5.884084701538086, 8.058465957641602, 10.232847213745117, 12.407227516174316, 14.581608772277832, 16.75598907470703, 18.930370330810547, 21.104751586914062, 23.279132843017578, 25.453514099121094, 27.62789535522461, 29.802276611328125, 31.97665786743164, 34.151039123535156, 36.325416564941406, 38.49980163574219, 40.67417907714844, 42.84856033325195, 45.02294158935547, 47.197322845458984, 49.3717041015625, 51.546085357666016, 53.72046661376953, 55.89484405517578, 58.06922912597656]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 4.0, 5.0, 5.0, 6.0, 12.0, 14.0, 18.0, 11.0, 23.0, 19.0, 14.0, 26.0, 29.0, 40.0, 41.0, 38.0, 57.0, 36.0, 49.0, 45.0, 42.0, 40.0, 47.0, 54.0, 40.0, 43.0, 40.0, 30.0, 33.0, 24.0, 19.0, 24.0, 15.0, 12.0, 13.0, 14.0, 10.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.34375, -13.8814697265625, -13.419189453125, -12.9569091796875, -12.49462890625, -12.0323486328125, -11.570068359375, -11.1077880859375, -10.6455078125, -10.1832275390625, -9.720947265625, -9.2586669921875, -8.79638671875, -8.3341064453125, -7.871826171875, -7.4095458984375, -6.947265625, -6.4849853515625, -6.022705078125, -5.5604248046875, -5.09814453125, -4.6358642578125, -4.173583984375, -3.7113037109375, -3.2490234375, -2.7867431640625, -2.324462890625, -1.8621826171875, -1.39990234375, -0.9376220703125, -0.475341796875, -0.0130615234375, 0.44921875, 0.9114990234375, 1.373779296875, 1.8360595703125, 2.29833984375, 2.7606201171875, 3.222900390625, 3.6851806640625, 4.1474609375, 4.6097412109375, 5.072021484375, 5.5343017578125, 5.99658203125, 6.4588623046875, 6.921142578125, 7.3834228515625, 7.845703125, 8.3079833984375, 8.770263671875, 9.2325439453125, 9.69482421875, 10.1571044921875, 10.619384765625, 11.0816650390625, 11.5439453125, 12.0062255859375, 12.468505859375, 12.9307861328125, 13.39306640625, 13.8553466796875, 14.317626953125, 14.7799072265625, 15.2421875]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 7.0, 1.0, 5.0, 5.0, 6.0, 10.0, 24.0, 24.0, 38.0, 38.0, 46.0, 83.0, 120.0, 143.0, 190.0, 312.0, 422.0, 744.0, 1362.0, 2850.0, 7877.0, 32414.0, 1099880.0, 2970339.0, 57973.0, 11410.0, 3876.0, 1641.0, 837.0, 510.0, 334.0, 226.0, 146.0, 108.0, 89.0, 61.0, 41.0, 34.0, 25.0, 17.0, 12.0, 5.0, 5.0, 5.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.6875, -64.4755859375, -62.263671875, -60.0517578125, -57.83984375, -55.6279296875, -53.416015625, -51.2041015625, -48.9921875, -46.7802734375, -44.568359375, -42.3564453125, -40.14453125, -37.9326171875, -35.720703125, -33.5087890625, -31.296875, -29.0849609375, -26.873046875, -24.6611328125, -22.44921875, -20.2373046875, -18.025390625, -15.8134765625, -13.6015625, -11.3896484375, -9.177734375, -6.9658203125, -4.75390625, -2.5419921875, -0.330078125, 1.8818359375, 4.09375, 6.3056640625, 8.517578125, 10.7294921875, 12.94140625, 15.1533203125, 17.365234375, 19.5771484375, 21.7890625, 24.0009765625, 26.212890625, 28.4248046875, 30.63671875, 32.8486328125, 35.060546875, 37.2724609375, 39.484375, 41.6962890625, 43.908203125, 46.1201171875, 48.33203125, 50.5439453125, 52.755859375, 54.9677734375, 57.1796875, 59.3916015625, 61.603515625, 63.8154296875, 66.02734375, 68.2392578125, 70.451171875, 72.6630859375, 74.875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 5.0, 5.0, 12.0, 7.0, 17.0, 25.0, 28.0, 37.0, 44.0, 55.0, 86.0, 111.0, 190.0, 236.0, 433.0, 630.0, 655.0, 510.0, 327.0, 183.0, 148.0, 90.0, 63.0, 40.0, 38.0, 26.0, 23.0, 21.0, 7.0, 5.0, 7.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-33.53125, -32.65478515625, -31.7783203125, -30.90185546875, -30.025390625, -29.14892578125, -28.2724609375, -27.39599609375, -26.51953125, -25.64306640625, -24.7666015625, -23.89013671875, -23.013671875, -22.13720703125, -21.2607421875, -20.38427734375, -19.5078125, -18.63134765625, -17.7548828125, -16.87841796875, -16.001953125, -15.12548828125, -14.2490234375, -13.37255859375, -12.49609375, -11.61962890625, -10.7431640625, -9.86669921875, -8.990234375, -8.11376953125, -7.2373046875, -6.36083984375, -5.484375, -4.60791015625, -3.7314453125, -2.85498046875, -1.978515625, -1.10205078125, -0.2255859375, 0.65087890625, 1.52734375, 2.40380859375, 3.2802734375, 4.15673828125, 5.033203125, 5.90966796875, 6.7861328125, 7.66259765625, 8.5390625, 9.41552734375, 10.2919921875, 11.16845703125, 12.044921875, 12.92138671875, 13.7978515625, 14.67431640625, 15.55078125, 16.42724609375, 17.3037109375, 18.18017578125, 19.056640625, 19.93310546875, 20.8095703125, 21.68603515625, 22.5625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 9.0, 19.0, 37.0, 62.0, 152.0, 331.0, 969.0, 2963.0, 9701.0, 38964.0, 253093.0, 3273127.0, 534690.0, 60286.0, 13874.0, 3844.0, 1303.0, 455.0, 200.0, 100.0, 47.0, 25.0, 17.0, 6.0, 0.0, 1.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.6875, -32.4228515625, -31.158203125, -29.8935546875, -28.62890625, -27.3642578125, -26.099609375, -24.8349609375, -23.5703125, -22.3056640625, -21.041015625, -19.7763671875, -18.51171875, -17.2470703125, -15.982421875, -14.7177734375, -13.453125, -12.1884765625, -10.923828125, -9.6591796875, -8.39453125, -7.1298828125, -5.865234375, -4.6005859375, -3.3359375, -2.0712890625, -0.806640625, 0.4580078125, 1.72265625, 2.9873046875, 4.251953125, 5.5166015625, 6.78125, 8.0458984375, 9.310546875, 10.5751953125, 11.83984375, 13.1044921875, 14.369140625, 15.6337890625, 16.8984375, 18.1630859375, 19.427734375, 20.6923828125, 21.95703125, 23.2216796875, 24.486328125, 25.7509765625, 27.015625, 28.2802734375, 29.544921875, 30.8095703125, 32.07421875, 33.3388671875, 34.603515625, 35.8681640625, 37.1328125, 38.3974609375, 39.662109375, 40.9267578125, 42.19140625, 43.4560546875, 44.720703125, 45.9853515625, 47.25]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 0.0, 5.0, 3.0, 6.0, 1.0, 5.0, 6.0, 16.0, 7.0, 9.0, 17.0, 16.0, 35.0, 39.0, 35.0, 39.0, 55.0, 53.0, 57.0, 75.0, 70.0, 68.0, 66.0, 62.0, 47.0, 38.0, 37.0, 28.0, 24.0, 22.0, 14.0, 13.0, 13.0, 12.0, 3.0, 6.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.01224517822266, -100.30632781982422, -96.60041809082031, -92.89450073242188, -89.18858337402344, -85.482666015625, -81.7767562866211, -78.07083892822266, -74.36492919921875, -70.65901184082031, -66.9531021118164, -63.24718475341797, -59.54126739501953, -55.83535385131836, -52.12944030761719, -48.42352294921875, -44.71760559082031, -41.01169204711914, -37.3057746887207, -33.59986114501953, -29.893945693969727, -26.188030242919922, -22.48211669921875, -18.776201248168945, -15.07028579711914, -11.364370346069336, -7.658455848693848, -3.9525413513183594, -0.2466259002685547, 3.45928955078125, 7.165203094482422, 10.871118545532227, 14.577041625976562, 18.282957077026367, 21.988872528076172, 25.694786071777344, 29.40070152282715, 33.10661697387695, 36.812530517578125, 40.51844787597656, 44.224361419677734, 47.930274963378906, 51.636192321777344, 55.342105865478516, 59.04801940917969, 62.753936767578125, 66.45985412597656, 70.16576385498047, 73.8716812133789, 77.57759857177734, 81.28350830078125, 84.98942565917969, 88.69534301757812, 92.40126037597656, 96.10717010498047, 99.8130874633789, 103.51899719238281, 107.22491455078125, 110.93082427978516, 114.6367416381836, 118.34265899658203, 122.04856872558594, 125.75448608398438, 129.4604034423828, 133.16632080078125]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 3.0, 5.0, 4.0, 6.0, 5.0, 7.0, 5.0, 8.0, 12.0, 15.0, 17.0, 13.0, 23.0, 21.0, 22.0, 41.0, 25.0, 42.0, 32.0, 37.0, 35.0, 32.0, 27.0, 46.0, 44.0, 32.0, 28.0, 36.0, 48.0, 27.0, 37.0, 27.0, 30.0, 42.0, 26.0, 27.0, 21.0, 20.0, 17.0, 8.0, 6.0, 5.0, 9.0, 10.0, 5.0, 8.0, 7.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0], "bins": [-107.6094970703125, -104.57537841796875, -101.541259765625, -98.50714111328125, -95.47303009033203, -92.43891143798828, -89.40479278564453, -86.37067413330078, -83.33656311035156, -80.30244445800781, -77.26832580566406, -74.23420715332031, -71.2000961303711, -68.16597747802734, -65.1318588256836, -62.097740173339844, -59.063621520996094, -56.029502868652344, -52.99538803100586, -49.96126937866211, -46.927154541015625, -43.893035888671875, -40.858917236328125, -37.824798583984375, -34.79068374633789, -31.756567001342773, -28.722450256347656, -25.688331604003906, -22.65421485900879, -19.620098114013672, -16.585979461669922, -13.551862716674805, -10.517738342285156, -7.483621120452881, -4.4495038986206055, -1.4153861999511719, 1.6187305450439453, 4.6528472900390625, 7.6869659423828125, 10.72108268737793, 13.755199432373047, 16.789316177368164, 19.82343292236328, 22.85755157470703, 25.89166831970215, 28.925785064697266, 31.959903717041016, 34.9940185546875, 38.02813720703125, 41.062255859375, 44.096370697021484, 47.130489349365234, 50.16460418701172, 53.19872283935547, 56.23284149169922, 59.26696014404297, 62.30107498168945, 65.33518981933594, 68.36930847167969, 71.40342712402344, 74.43754577636719, 77.47166442871094, 80.50578308105469, 83.5398941040039, 86.57401275634766]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 4.0, 6.0, 4.0, 4.0, 7.0, 4.0, 17.0, 17.0, 11.0, 10.0, 21.0, 22.0, 22.0, 30.0, 30.0, 34.0, 36.0, 40.0, 33.0, 35.0, 38.0, 43.0, 41.0, 36.0, 27.0, 40.0, 47.0, 34.0, 29.0, 37.0, 34.0, 32.0, 32.0, 27.0, 22.0, 17.0, 9.0, 11.0, 13.0, 6.0, 10.0, 9.0, 6.0, 8.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-175.5, -169.81640625, -164.1328125, -158.44921875, -152.765625, -147.08203125, -141.3984375, -135.71484375, -130.03125, -124.34765625, -118.6640625, -112.98046875, -107.296875, -101.61328125, -95.9296875, -90.24609375, -84.5625, -78.87890625, -73.1953125, -67.51171875, -61.828125, -56.14453125, -50.4609375, -44.77734375, -39.09375, -33.41015625, -27.7265625, -22.04296875, -16.359375, -10.67578125, -4.9921875, 0.69140625, 6.375, 12.05859375, 17.7421875, 23.42578125, 29.109375, 34.79296875, 40.4765625, 46.16015625, 51.84375, 57.52734375, 63.2109375, 68.89453125, 74.578125, 80.26171875, 85.9453125, 91.62890625, 97.3125, 102.99609375, 108.6796875, 114.36328125, 120.046875, 125.73046875, 131.4140625, 137.09765625, 142.78125, 148.46484375, 154.1484375, 159.83203125, 165.515625, 171.19921875, 176.8828125, 182.56640625, 188.25]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 6.0, 10.0, 17.0, 18.0, 25.0, 31.0, 61.0, 101.0, 113.0, 156.0, 229.0, 361.0, 498.0, 717.0, 1035.0, 1420.0, 2037.0, 3037.0, 4314.0, 6322.0, 9506.0, 14239.0, 22002.0, 34786.0, 55485.0, 90977.0, 154749.0, 234883.0, 158348.0, 93587.0, 56694.0, 34991.0, 22459.0, 14764.0, 9735.0, 6562.0, 4386.0, 2934.0, 2110.0, 1494.0, 1014.0, 718.0, 523.0, 340.0, 232.0, 155.0, 120.0, 86.0, 55.0, 34.0, 30.0, 21.0, 15.0, 12.0, 7.0, 5.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.03125, -2.935089111328125, -2.83892822265625, -2.742767333984375, -2.6466064453125, -2.550445556640625, -2.45428466796875, -2.358123779296875, -2.261962890625, -2.165802001953125, -2.06964111328125, -1.973480224609375, -1.8773193359375, -1.781158447265625, -1.68499755859375, -1.588836669921875, -1.49267578125, -1.396514892578125, -1.30035400390625, -1.204193115234375, -1.1080322265625, -1.011871337890625, -0.91571044921875, -0.819549560546875, -0.723388671875, -0.627227783203125, -0.53106689453125, -0.434906005859375, -0.3387451171875, -0.242584228515625, -0.14642333984375, -0.050262451171875, 0.0458984375, 0.142059326171875, 0.23822021484375, 0.334381103515625, 0.4305419921875, 0.526702880859375, 0.62286376953125, 0.719024658203125, 0.815185546875, 0.911346435546875, 1.00750732421875, 1.103668212890625, 1.1998291015625, 1.295989990234375, 1.39215087890625, 1.488311767578125, 1.58447265625, 1.680633544921875, 1.77679443359375, 1.872955322265625, 1.9691162109375, 2.065277099609375, 2.16143798828125, 2.257598876953125, 2.353759765625, 2.449920654296875, 2.54608154296875, 2.642242431640625, 2.7384033203125, 2.834564208984375, 2.93072509765625, 3.026885986328125, 3.123046875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 5.0, 8.0, 5.0, 8.0, 12.0, 11.0, 15.0, 15.0, 20.0, 19.0, 19.0, 20.0, 26.0, 33.0, 41.0, 27.0, 30.0, 34.0, 20.0, 43.0, 38.0, 40.0, 1066.0, 36.0, 37.0, 37.0, 39.0, 35.0, 31.0, 31.0, 31.0, 21.0, 27.0, 20.0, 17.0, 11.0, 17.0, 6.0, 16.0, 9.0, 6.0, 3.0, 12.0, 7.0, 6.0, 5.0, 6.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.5, -101.90625, -98.3125, -94.71875, -91.125, -87.53125, -83.9375, -80.34375, -76.75, -73.15625, -69.5625, -65.96875, -62.375, -58.78125, -55.1875, -51.59375, -48.0, -44.40625, -40.8125, -37.21875, -33.625, -30.03125, -26.4375, -22.84375, -19.25, -15.65625, -12.0625, -8.46875, -4.875, -1.28125, 2.3125, 5.90625, 9.5, 13.09375, 16.6875, 20.28125, 23.875, 27.46875, 31.0625, 34.65625, 38.25, 41.84375, 45.4375, 49.03125, 52.625, 56.21875, 59.8125, 63.40625, 67.0, 70.59375, 74.1875, 77.78125, 81.375, 84.96875, 88.5625, 92.15625, 95.75, 99.34375, 102.9375, 106.53125, 110.125, 113.71875, 117.3125, 120.90625, 124.5]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 3.0, 10.0, 13.0, 18.0, 33.0, 58.0, 78.0, 105.0, 162.0, 237.0, 317.0, 447.0, 632.0, 927.0, 1233.0, 1803.0, 2566.0, 3621.0, 5185.0, 7602.0, 11328.0, 16940.0, 26139.0, 39986.0, 63882.0, 102945.0, 172299.0, 1261305.0, 139008.0, 84260.0, 53068.0, 33758.0, 21715.0, 14265.0, 9726.0, 6539.0, 4498.0, 3014.0, 2131.0, 1498.0, 1057.0, 808.0, 590.0, 443.0, 299.0, 197.0, 148.0, 80.0, 57.0, 35.0, 28.0, 21.0, 10.0, 5.0, 7.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.859375, -1.799957275390625, -1.74053955078125, -1.681121826171875, -1.6217041015625, -1.562286376953125, -1.50286865234375, -1.443450927734375, -1.384033203125, -1.324615478515625, -1.26519775390625, -1.205780029296875, -1.1463623046875, -1.086944580078125, -1.02752685546875, -0.968109130859375, -0.90869140625, -0.849273681640625, -0.78985595703125, -0.730438232421875, -0.6710205078125, -0.611602783203125, -0.55218505859375, -0.492767333984375, -0.433349609375, -0.373931884765625, -0.31451416015625, -0.255096435546875, -0.1956787109375, -0.136260986328125, -0.07684326171875, -0.017425537109375, 0.0419921875, 0.101409912109375, 0.16082763671875, 0.220245361328125, 0.2796630859375, 0.339080810546875, 0.39849853515625, 0.457916259765625, 0.517333984375, 0.576751708984375, 0.63616943359375, 0.695587158203125, 0.7550048828125, 0.814422607421875, 0.87384033203125, 0.933258056640625, 0.99267578125, 1.052093505859375, 1.11151123046875, 1.170928955078125, 1.2303466796875, 1.289764404296875, 1.34918212890625, 1.408599853515625, 1.468017578125, 1.527435302734375, 1.58685302734375, 1.646270751953125, 1.7056884765625, 1.765106201171875, 1.82452392578125, 1.883941650390625, 1.943359375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 2.0, 4.0, 2.0, 6.0, 6.0, 17.0, 16.0, 17.0, 22.0, 28.0, 41.0, 42.0, 48.0, 101.0, 213.0, 146.0, 55.0, 54.0, 40.0, 21.0, 30.0, 25.0, 12.0, 6.0, 11.0, 7.0, 3.0, 9.0, 3.0, 7.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005252838134765625, -0.005087316036224365, -0.0049217939376831055, -0.004756271839141846, -0.004590749740600586, -0.004425227642059326, -0.004259705543518066, -0.004094183444976807, -0.003928661346435547, -0.003763139247894287, -0.0035976171493530273, -0.0034320950508117676, -0.003266572952270508, -0.003101050853729248, -0.0029355287551879883, -0.0027700066566467285, -0.0026044845581054688, -0.002438962459564209, -0.0022734403610229492, -0.0021079182624816895, -0.0019423961639404297, -0.00177687406539917, -0.0016113519668579102, -0.0014458298683166504, -0.0012803077697753906, -0.0011147856712341309, -0.0009492635726928711, -0.0007837414741516113, -0.0006182193756103516, -0.0004526972770690918, -0.00028717517852783203, -0.00012165307998657227, 4.38690185546875e-05, 0.00020939111709594727, 0.00037491321563720703, 0.0005404353141784668, 0.0007059574127197266, 0.0008714795112609863, 0.001037001609802246, 0.0012025237083435059, 0.0013680458068847656, 0.0015335679054260254, 0.0016990900039672852, 0.001864612102508545, 0.0020301342010498047, 0.0021956562995910645, 0.0023611783981323242, 0.002526700496673584, 0.0026922225952148438, 0.0028577446937561035, 0.0030232667922973633, 0.003188788890838623, 0.003354310989379883, 0.0035198330879211426, 0.0036853551864624023, 0.003850877285003662, 0.004016399383544922, 0.004181921482086182, 0.004347443580627441, 0.004512965679168701, 0.004678487777709961, 0.004844009876251221, 0.0050095319747924805, 0.00517505407333374, 0.005340576171875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 7.0, 2.0, 7.0, 11.0, 8.0, 25.0, 33.0, 58.0, 76.0, 116.0, 221.0, 343.0, 623.0, 1192.0, 2526.0, 5754.0, 15538.0, 50181.0, 214599.0, 602950.0, 107064.0, 29495.0, 9909.0, 3881.0, 1832.0, 902.0, 490.0, 273.0, 167.0, 97.0, 68.0, 43.0, 17.0, 16.0, 13.0, 7.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0269622802734375, -0.026127099990844727, -0.025291919708251953, -0.02445673942565918, -0.023621559143066406, -0.022786378860473633, -0.02195119857788086, -0.021116018295288086, -0.020280838012695312, -0.01944565773010254, -0.018610477447509766, -0.017775297164916992, -0.01694011688232422, -0.016104936599731445, -0.015269756317138672, -0.014434576034545898, -0.013599395751953125, -0.012764215469360352, -0.011929035186767578, -0.011093854904174805, -0.010258674621582031, -0.009423494338989258, -0.008588314056396484, -0.007753133773803711, -0.0069179534912109375, -0.006082773208618164, -0.005247592926025391, -0.004412412643432617, -0.0035772323608398438, -0.0027420520782470703, -0.0019068717956542969, -0.0010716915130615234, -0.00023651123046875, 0.0005986690521240234, 0.0014338493347167969, 0.0022690296173095703, 0.0031042098999023438, 0.003939390182495117, 0.004774570465087891, 0.005609750747680664, 0.0064449310302734375, 0.007280111312866211, 0.008115291595458984, 0.008950471878051758, 0.009785652160644531, 0.010620832443237305, 0.011456012725830078, 0.012291193008422852, 0.013126373291015625, 0.013961553573608398, 0.014796733856201172, 0.015631914138793945, 0.01646709442138672, 0.017302274703979492, 0.018137454986572266, 0.01897263526916504, 0.019807815551757812, 0.020642995834350586, 0.02147817611694336, 0.022313356399536133, 0.023148536682128906, 0.02398371696472168, 0.024818897247314453, 0.025654077529907227, 0.0264892578125]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 10.0, 17.0, 23.0, 37.0, 78.0, 93.0, 191.0, 177.0, 118.0, 68.0, 41.0, 30.0, 28.0, 22.0, 15.0, 11.0, 8.0, 8.0, 4.0, 6.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0074348836205899715, -0.007020418532192707, -0.006605953443795443, -0.006191488355398178, -0.005777023732662201, -0.005362558178603649, -0.004948093555867672, -0.0045336284674704075, -0.004119163379073143, -0.0037046982906758785, -0.003290233202278614, -0.0028757683467119932, -0.0024613032583147287, -0.0020468381699174643, -0.0016323733143508434, -0.001217908225953579, -0.0008034431375563145, -0.0003889781073667109, 2.5486922822892666e-05, 0.0004399518948048353, 0.0008544169832020998, 0.0012688820715993643, 0.001683346927165985, 0.0020978120155632496, 0.002512277103960514, 0.0029267421923577785, 0.003341207280755043, 0.003755672136321664, 0.004170137457549572, 0.004584602080285549, 0.004999067168682814, 0.005413532257080078, 0.005827996879816055, 0.00624246196821332, 0.006656927056610584, 0.007071391679346561, 0.007485857233405113, 0.00790032185614109, 0.008314786478877068, 0.00872925203293562, 0.009143717586994171, 0.009558182209730148, 0.0099726477637887, 0.010387112386524677, 0.010801577940583229, 0.011216042563319206, 0.011630507186055183, 0.012044972740113735, 0.012459437362849712, 0.01287390198558569, 0.013288367539644241, 0.013702832162380219, 0.01411729771643877, 0.014531762339174747, 0.0149462278932333, 0.015360692515969276, 0.015775157138705254, 0.01618962176144123, 0.016604086384177208, 0.017018552869558334, 0.01743301749229431, 0.01784748211503029, 0.018261946737766266, 0.018676411360502243, 0.01909087784588337]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 8.0, 7.0, 6.0, 4.0, 11.0, 11.0, 8.0, 9.0, 17.0, 17.0, 16.0, 16.0, 27.0, 24.0, 22.0, 25.0, 29.0, 28.0, 30.0, 36.0, 31.0, 40.0, 34.0, 35.0, 42.0, 24.0, 33.0, 44.0, 26.0, 24.0, 37.0, 35.0, 31.0, 18.0, 24.0, 20.0, 17.0, 21.0, 19.0, 12.0, 10.0, 11.0, 15.0, 11.0, 10.0, 9.0, 4.0, 5.0, 6.0, 6.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.004262208938598633, -0.004122590646147728, -0.003982972353696823, -0.0038433540612459183, -0.0037037357687950134, -0.0035641174763441086, -0.0034244991838932037, -0.003284880891442299, -0.003145262598991394, -0.003005644306540489, -0.0028660260140895844, -0.0027264077216386795, -0.0025867894291877747, -0.00244717113673687, -0.002307552844285965, -0.00216793455183506, -0.0020283162593841553, -0.0018886979669332504, -0.0017490796744823456, -0.0016094613820314407, -0.0014698430895805359, -0.001330224797129631, -0.0011906065046787262, -0.0010509882122278214, -0.0009113699197769165, -0.0007717516273260117, -0.0006321333348751068, -0.000492515042424202, -0.0003528967499732971, -0.00021327845752239227, -7.366016507148743e-05, 6.595812737941742e-05, 0.00020557641983032227, 0.0003451947122812271, 0.00048481300473213196, 0.0006244312971830368, 0.0007640495896339417, 0.0009036678820848465, 0.0010432861745357513, 0.0011829044669866562, 0.001322522759437561, 0.0014621410518884659, 0.0016017593443393707, 0.0017413776367902756, 0.0018809959292411804, 0.0020206142216920853, 0.00216023251414299, 0.002299850806593895, 0.0024394690990448, 0.0025790873914957047, 0.0027187056839466095, 0.0028583239763975143, 0.002997942268848419, 0.003137560561299324, 0.003277178853750229, 0.0034167971462011337, 0.0035564154386520386, 0.0036960337311029434, 0.0038356520235538483, 0.003975270316004753, 0.004114888608455658, 0.004254506900906563, 0.004394125193357468, 0.0045337434858083725, 0.004673361778259277]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 4.0, 6.0, 4.0, 3.0, 8.0, 3.0, 18.0, 17.0, 11.0, 10.0, 20.0, 22.0, 23.0, 30.0, 30.0, 34.0, 35.0, 39.0, 34.0, 35.0, 39.0, 43.0, 40.0, 37.0, 27.0, 38.0, 49.0, 33.0, 30.0, 37.0, 32.0, 34.0, 32.0, 26.0, 23.0, 17.0, 9.0, 11.0, 13.0, 6.0, 10.0, 9.0, 6.0, 8.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-175.625, -169.939453125, -164.25390625, -158.568359375, -152.8828125, -147.197265625, -141.51171875, -135.826171875, -130.140625, -124.455078125, -118.76953125, -113.083984375, -107.3984375, -101.712890625, -96.02734375, -90.341796875, -84.65625, -78.970703125, -73.28515625, -67.599609375, -61.9140625, -56.228515625, -50.54296875, -44.857421875, -39.171875, -33.486328125, -27.80078125, -22.115234375, -16.4296875, -10.744140625, -5.05859375, 0.626953125, 6.3125, 11.998046875, 17.68359375, 23.369140625, 29.0546875, 34.740234375, 40.42578125, 46.111328125, 51.796875, 57.482421875, 63.16796875, 68.853515625, 74.5390625, 80.224609375, 85.91015625, 91.595703125, 97.28125, 102.966796875, 108.65234375, 114.337890625, 120.0234375, 125.708984375, 131.39453125, 137.080078125, 142.765625, 148.451171875, 154.13671875, 159.822265625, 165.5078125, 171.193359375, 176.87890625, 182.564453125, 188.25]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 0.0, 3.0, 3.0, 8.0, 3.0, 7.0, 3.0, 14.0, 15.0, 13.0, 18.0, 22.0, 38.0, 65.0, 69.0, 116.0, 208.0, 430.0, 790.0, 1873.0, 5245.0, 16726.0, 66401.0, 332885.0, 483447.0, 103482.0, 24694.0, 7224.0, 2540.0, 1065.0, 456.0, 253.0, 125.0, 79.0, 63.0, 50.0, 28.0, 18.0, 12.0, 18.0, 4.0, 13.0, 10.0, 5.0, 7.0, 1.0, 2.0, 3.0, 0.0, 4.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-29.90625, -28.946044921875, -27.98583984375, -27.025634765625, -26.0654296875, -25.105224609375, -24.14501953125, -23.184814453125, -22.224609375, -21.264404296875, -20.30419921875, -19.343994140625, -18.3837890625, -17.423583984375, -16.46337890625, -15.503173828125, -14.54296875, -13.582763671875, -12.62255859375, -11.662353515625, -10.7021484375, -9.741943359375, -8.78173828125, -7.821533203125, -6.861328125, -5.901123046875, -4.94091796875, -3.980712890625, -3.0205078125, -2.060302734375, -1.10009765625, -0.139892578125, 0.8203125, 1.780517578125, 2.74072265625, 3.700927734375, 4.6611328125, 5.621337890625, 6.58154296875, 7.541748046875, 8.501953125, 9.462158203125, 10.42236328125, 11.382568359375, 12.3427734375, 13.302978515625, 14.26318359375, 15.223388671875, 16.18359375, 17.143798828125, 18.10400390625, 19.064208984375, 20.0244140625, 20.984619140625, 21.94482421875, 22.905029296875, 23.865234375, 24.825439453125, 25.78564453125, 26.745849609375, 27.7060546875, 28.666259765625, 29.62646484375, 30.586669921875, 31.546875]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 8.0, 11.0, 15.0, 24.0, 34.0, 51.0, 78.0, 94.0, 107.0, 148.0, 2085.0, 76.0, 88.0, 73.0, 55.0, 36.0, 30.0, 16.0, 11.0, 11.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-510.5, -494.0703125, -477.640625, -461.2109375, -444.78125, -428.3515625, -411.921875, -395.4921875, -379.0625, -362.6328125, -346.203125, -329.7734375, -313.34375, -296.9140625, -280.484375, -264.0546875, -247.625, -231.1953125, -214.765625, -198.3359375, -181.90625, -165.4765625, -149.046875, -132.6171875, -116.1875, -99.7578125, -83.328125, -66.8984375, -50.46875, -34.0390625, -17.609375, -1.1796875, 15.25, 31.6796875, 48.109375, 64.5390625, 80.96875, 97.3984375, 113.828125, 130.2578125, 146.6875, 163.1171875, 179.546875, 195.9765625, 212.40625, 228.8359375, 245.265625, 261.6953125, 278.125, 294.5546875, 310.984375, 327.4140625, 343.84375, 360.2734375, 376.703125, 393.1328125, 409.5625, 425.9921875, 442.421875, 458.8515625, 475.28125, 491.7109375, 508.140625, 524.5703125, 541.0]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 9.0, 12.0, 11.0, 15.0, 18.0, 43.0, 43.0, 63.0, 170.0, 205.0, 404.0, 831.0, 2601.0, 27793.0, 2947763.0, 156884.0, 6291.0, 1237.0, 525.0, 303.0, 178.0, 108.0, 66.0, 45.0, 26.0, 18.0, 8.0, 10.0, 6.0, 4.0, 1.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.9375, -53.8447265625, -51.751953125, -49.6591796875, -47.56640625, -45.4736328125, -43.380859375, -41.2880859375, -39.1953125, -37.1025390625, -35.009765625, -32.9169921875, -30.82421875, -28.7314453125, -26.638671875, -24.5458984375, -22.453125, -20.3603515625, -18.267578125, -16.1748046875, -14.08203125, -11.9892578125, -9.896484375, -7.8037109375, -5.7109375, -3.6181640625, -1.525390625, 0.5673828125, 2.66015625, 4.7529296875, 6.845703125, 8.9384765625, 11.03125, 13.1240234375, 15.216796875, 17.3095703125, 19.40234375, 21.4951171875, 23.587890625, 25.6806640625, 27.7734375, 29.8662109375, 31.958984375, 34.0517578125, 36.14453125, 38.2373046875, 40.330078125, 42.4228515625, 44.515625, 46.6083984375, 48.701171875, 50.7939453125, 52.88671875, 54.9794921875, 57.072265625, 59.1650390625, 61.2578125, 63.3505859375, 65.443359375, 67.5361328125, 69.62890625, 71.7216796875, 73.814453125, 75.9072265625, 78.0]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 6.0, 7.0, 11.0, 16.0, 22.0, 33.0, 77.0, 131.0, 167.0, 186.0, 146.0, 74.0, 36.0, 31.0, 21.0, 11.0, 5.0, 7.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-427.74658203125, -414.37811279296875, -401.0096435546875, -387.64117431640625, -374.272705078125, -360.90423583984375, -347.5357971191406, -334.1673278808594, -320.7988586425781, -307.4303894042969, -294.0619201660156, -280.6934509277344, -267.32501220703125, -253.95652770996094, -240.58807373046875, -227.2196044921875, -213.85113525390625, -200.482666015625, -187.11419677734375, -173.74574279785156, -160.3772735595703, -147.00880432128906, -133.64035034179688, -120.27188110351562, -106.90341186523438, -93.53494262695312, -80.1664810180664, -66.79801940917969, -53.42955017089844, -40.06108093261719, -26.69261932373047, -13.32415771484375, 0.044281005859375, 13.41274642944336, 26.781211853027344, 40.14967727661133, 53.51814270019531, 66.88661193847656, 80.25507354736328, 93.62353515625, 106.99200439453125, 120.3604736328125, 133.72894287109375, 147.09739685058594, 160.4658660888672, 173.83433532714844, 187.20278930664062, 200.57125854492188, 213.93972778320312, 227.30819702148438, 240.67666625976562, 254.0451202392578, 267.41357421875, 280.78204345703125, 294.1505126953125, 307.51898193359375, 320.887451171875, 334.25592041015625, 347.6243896484375, 360.99285888671875, 374.361328125, 387.72979736328125, 401.0982360839844, 414.4667053222656, 427.8351745605469]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 7.0, 12.0, 12.0, 16.0, 14.0, 17.0, 12.0, 19.0, 18.0, 23.0, 35.0, 22.0, 38.0, 46.0, 43.0, 41.0, 38.0, 42.0, 43.0, 43.0, 44.0, 43.0, 37.0, 31.0, 36.0, 28.0, 33.0, 22.0, 24.0, 26.0, 24.0, 18.0, 15.0, 16.0, 12.0, 8.0, 2.0, 8.0, 9.0, 8.0, 5.0, 4.0, 5.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-322.82275390625, -311.8260192871094, -300.8292541503906, -289.83251953125, -278.83575439453125, -267.8390197753906, -256.84228515625, -245.8455352783203, -234.84878540039062, -223.85203552246094, -212.85528564453125, -201.85855102539062, -190.86180114746094, -179.86505126953125, -168.86831665039062, -157.87156677246094, -146.87481689453125, -135.87806701660156, -124.8813247680664, -113.88458251953125, -102.88783264160156, -91.89108276367188, -80.89434051513672, -69.89759826660156, -58.900848388671875, -47.90410232543945, -36.90735626220703, -25.91061019897461, -14.913864135742188, -3.9171180725097656, 7.079627990722656, 18.076370239257812, 29.0731201171875, 40.06986618041992, 51.066612243652344, 62.063358306884766, 73.06010437011719, 84.05685424804688, 95.05359649658203, 106.05033874511719, 117.04708862304688, 128.04383850097656, 139.04058837890625, 150.03732299804688, 161.03407287597656, 172.03082275390625, 183.02755737304688, 194.02430725097656, 205.02105712890625, 216.01780700683594, 227.01455688476562, 238.01129150390625, 249.00804138183594, 260.0047912597656, 271.00152587890625, 281.998291015625, 292.9950256347656, 303.99176025390625, 314.988525390625, 325.9852600097656, 336.98199462890625, 347.978759765625, 358.9754943847656, 369.97222900390625, 380.968994140625]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 2.0, 3.0, 5.0, 2.0, 6.0, 11.0, 10.0, 14.0, 22.0, 23.0, 27.0, 33.0, 37.0, 58.0, 68.0, 77.0, 87.0, 131.0, 155.0, 203.0, 282.0, 391.0, 562.0, 895.0, 1041470.0, 1215.0, 714.0, 509.0, 391.0, 265.0, 195.0, 135.0, 109.0, 82.0, 80.0, 61.0, 46.0, 40.0, 29.0, 25.0, 23.0, 14.0, 11.0, 13.0, 7.0, 6.0, 6.0, 4.0, 7.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-129.21395874023438, -125.506103515625, -121.79825592041016, -118.09040069580078, -114.38255310058594, -110.67469787597656, -106.96684265136719, -103.25899505615234, -99.55113983154297, -95.8432846069336, -92.13543701171875, -88.42758178710938, -84.71973419189453, -81.01187896728516, -77.30403137207031, -73.59617614746094, -69.88832092285156, -66.18046569824219, -62.472618103027344, -58.76476287841797, -55.05691146850586, -51.34906005859375, -47.64120864868164, -43.93335723876953, -40.22550964355469, -36.51765823364258, -32.80980682373047, -29.101953506469727, -25.394100189208984, -21.686248779296875, -17.978397369384766, -14.270544052124023, -10.562690734863281, -6.8548383712768555, -3.146986484527588, 0.5608654022216797, 4.2687177658081055, 7.976570129394531, 11.68442153930664, 15.392274856567383, 19.100126266479492, 22.8079776763916, 26.515830993652344, 30.223682403564453, 33.93153381347656, 37.63938903808594, 41.34723663330078, 45.055091857910156, 48.762943267822266, 52.470794677734375, 56.178646087646484, 59.886497497558594, 63.59435272216797, 67.30220031738281, 71.01005554199219, 74.71791076660156, 78.4257583618164, 82.13361358642578, 85.84146118164062, 89.54931640625, 93.25716400146484, 96.96501922607422, 100.67286682128906, 104.38072204589844, 108.08857727050781]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 5.0, 2.0, 5.0, 4.0, 3.0, 8.0, 9.0, 11.0, 20.0, 22.0, 31.0, 46.0, 129.0, 796.0, 51427168.0, 34027.0, 662.0, 108.0, 41.0, 18.0, 16.0, 9.0, 5.0, 8.0, 13.0, 3.0, 4.0, 6.0, 0.0, 2.0, 0.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-947.4556884765625, -910.9619750976562, -874.46826171875, -837.9745483398438, -801.4808349609375, -764.9871826171875, -728.4934692382812, -691.999755859375, -655.5060424804688, -619.0123291015625, -582.5186157226562, -546.02490234375, -509.5312194824219, -473.0375061035156, -436.5438232421875, -400.05010986328125, -363.556396484375, -327.06268310546875, -290.5689697265625, -254.07528686523438, -217.58157348632812, -181.08786010742188, -144.5941619873047, -108.1004638671875, -71.60675048828125, -35.11304473876953, 1.3806610107421875, 37.874366760253906, 74.36807250976562, 110.86178588867188, 147.35548400878906, 183.84918212890625, 220.3427734375, 256.83648681640625, 293.3302001953125, 329.8238830566406, 366.3175964355469, 402.8113098144531, 439.30499267578125, 475.7987060546875, 512.2924194335938, 548.7861328125, 585.2798461914062, 621.7735595703125, 658.2672119140625, 694.760986328125, 731.254638671875, 767.7483520507812, 804.2420654296875, 840.7357788085938, 877.2294921875, 913.7232055664062, 950.2169189453125, 986.7105712890625, 1023.2042846679688, 1059.697998046875, 1096.191650390625, 1132.685302734375, 1169.1790771484375, 1205.6727294921875, 1242.16650390625, 1278.66015625, 1315.1539306640625, 1351.6475830078125, 1388.141357421875]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 5.0, 2.0, 2.0, 5.0, 5.0, 9.0, 7.0, 15.0, 22.0, 38.0, 78.0, 171.0, 239.0, 400.0, 516.0, 761.0, 1069.0, 1518.0, 2360.0, 3605.0, 5586.0, 8668.0, 14220.0, 22126.0, 36893.0, 61161.0, 104489.0, 182662.0, 339232.0, 686611.0, 3895359.0, 403631.0, 215679.0, 121105.0, 71208.0, 42044.0, 25633.0, 15983.0, 9860.0, 6256.0, 4240.0, 2722.0, 1786.0, 1171.0, 772.0, 456.0, 345.0, 214.0, 137.0, 98.0, 76.0, 74.0, 54.0, 34.0, 23.0, 8.0, 7.0, 0.0, 0.0, 2.0], "bins": [-1.248046875, -1.21148681640625, -1.1749267578125, -1.13836669921875, -1.101806640625, -1.06524658203125, -1.0286865234375, -0.99212646484375, -0.95556640625, -0.91900634765625, -0.8824462890625, -0.84588623046875, -0.809326171875, -0.77276611328125, -0.7362060546875, -0.69964599609375, -0.6630859375, -0.62652587890625, -0.5899658203125, -0.55340576171875, -0.516845703125, -0.48028564453125, -0.4437255859375, -0.40716552734375, -0.37060546875, -0.33404541015625, -0.2974853515625, -0.26092529296875, -0.224365234375, -0.18780517578125, -0.1512451171875, -0.11468505859375, -0.078125, -0.04156494140625, -0.0050048828125, 0.03155517578125, 0.068115234375, 0.10467529296875, 0.1412353515625, 0.17779541015625, 0.21435546875, 0.25091552734375, 0.2874755859375, 0.32403564453125, 0.360595703125, 0.39715576171875, 0.4337158203125, 0.47027587890625, 0.5068359375, 0.54339599609375, 0.5799560546875, 0.61651611328125, 0.653076171875, 0.68963623046875, 0.7261962890625, 0.76275634765625, 0.79931640625, 0.83587646484375, 0.8724365234375, 0.90899658203125, 0.945556640625, 0.98211669921875, 1.0186767578125, 1.05523681640625, 1.091796875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 6.0, 6.0, 5.0, 7.0, 11.0, 14.0, 10.0, 25.0, 16.0, 32.0, 26.0, 27.0, 42.0, 32.0, 41.0, 32.0, 37.0, 40.0, 39.0, 1087.0, 37.0, 51.0, 41.0, 35.0, 35.0, 44.0, 27.0, 33.0, 36.0, 24.0, 26.0, 27.0, 14.0, 10.0, 11.0, 7.0, 6.0, 10.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 5.0, 0.0, 2.0], "bins": [-114.6875, -111.4384765625, -108.189453125, -104.9404296875, -101.69140625, -98.4423828125, -95.193359375, -91.9443359375, -88.6953125, -85.4462890625, -82.197265625, -78.9482421875, -75.69921875, -72.4501953125, -69.201171875, -65.9521484375, -62.703125, -59.4541015625, -56.205078125, -52.9560546875, -49.70703125, -46.4580078125, -43.208984375, -39.9599609375, -36.7109375, -33.4619140625, -30.212890625, -26.9638671875, -23.71484375, -20.4658203125, -17.216796875, -13.9677734375, -10.71875, -7.4697265625, -4.220703125, -0.9716796875, 2.27734375, 5.5263671875, 8.775390625, 12.0244140625, 15.2734375, 18.5224609375, 21.771484375, 25.0205078125, 28.26953125, 31.5185546875, 34.767578125, 38.0166015625, 41.265625, 44.5146484375, 47.763671875, 51.0126953125, 54.26171875, 57.5107421875, 60.759765625, 64.0087890625, 67.2578125, 70.5068359375, 73.755859375, 77.0048828125, 80.25390625, 83.5029296875, 86.751953125, 90.0009765625, 93.25]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [4.0, 4.0, 1.0, 5.0, 5.0, 10.0, 18.0, 13.0, 30.0, 49.0, 54.0, 58.0, 122.0, 133.0, 216.0, 329.0, 497.0, 697.0, 1037.0, 1463.0, 2079.0, 3157.0, 4877.0, 7059.0, 10526.0, 16452.0, 24488.0, 37595.0, 57265.0, 88896.0, 143730.0, 249456.0, 474989.0, 4007283.0, 492365.0, 255988.0, 148192.0, 90765.0, 58786.0, 38065.0, 25262.0, 16427.0, 11012.0, 7142.0, 4888.0, 3155.0, 2086.0, 1489.0, 1044.0, 642.0, 455.0, 331.0, 245.0, 174.0, 114.0, 56.0, 59.0, 25.0, 28.0, 19.0, 12.0, 18.0, 10.0, 5.0], "bins": [-1.482421875, -1.438201904296875, -1.39398193359375, -1.349761962890625, -1.3055419921875, -1.261322021484375, -1.21710205078125, -1.172882080078125, -1.128662109375, -1.084442138671875, -1.04022216796875, -0.996002197265625, -0.9517822265625, -0.907562255859375, -0.86334228515625, -0.819122314453125, -0.77490234375, -0.730682373046875, -0.68646240234375, -0.642242431640625, -0.5980224609375, -0.553802490234375, -0.50958251953125, -0.465362548828125, -0.421142578125, -0.376922607421875, -0.33270263671875, -0.288482666015625, -0.2442626953125, -0.200042724609375, -0.15582275390625, -0.111602783203125, -0.0673828125, -0.023162841796875, 0.02105712890625, 0.065277099609375, 0.1094970703125, 0.153717041015625, 0.19793701171875, 0.242156982421875, 0.286376953125, 0.330596923828125, 0.37481689453125, 0.419036865234375, 0.4632568359375, 0.507476806640625, 0.55169677734375, 0.595916748046875, 0.64013671875, 0.684356689453125, 0.72857666015625, 0.772796630859375, 0.8170166015625, 0.861236572265625, 0.90545654296875, 0.949676513671875, 0.993896484375, 1.038116455078125, 1.08233642578125, 1.126556396484375, 1.1707763671875, 1.214996337890625, 1.25921630859375, 1.303436279296875, 1.34765625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 7.0, 10.0, 3.0, 4.0, 11.0, 15.0, 13.0, 14.0, 20.0, 21.0, 24.0, 24.0, 24.0, 30.0, 35.0, 33.0, 46.0, 35.0, 43.0, 40.0, 33.0, 1062.0, 29.0, 43.0, 34.0, 39.0, 36.0, 33.0, 26.0, 25.0, 25.0, 24.0, 22.0, 27.0, 23.0, 14.0, 17.0, 18.0, 5.0, 12.0, 11.0, 4.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-128.5, -124.275390625, -120.05078125, -115.826171875, -111.6015625, -107.376953125, -103.15234375, -98.927734375, -94.703125, -90.478515625, -86.25390625, -82.029296875, -77.8046875, -73.580078125, -69.35546875, -65.130859375, -60.90625, -56.681640625, -52.45703125, -48.232421875, -44.0078125, -39.783203125, -35.55859375, -31.333984375, -27.109375, -22.884765625, -18.66015625, -14.435546875, -10.2109375, -5.986328125, -1.76171875, 2.462890625, 6.6875, 10.912109375, 15.13671875, 19.361328125, 23.5859375, 27.810546875, 32.03515625, 36.259765625, 40.484375, 44.708984375, 48.93359375, 53.158203125, 57.3828125, 61.607421875, 65.83203125, 70.056640625, 74.28125, 78.505859375, 82.73046875, 86.955078125, 91.1796875, 95.404296875, 99.62890625, 103.853515625, 108.078125, 112.302734375, 116.52734375, 120.751953125, 124.9765625, 129.201171875, 133.42578125, 137.650390625, 141.875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 5.0, 3.0, 2.0, 1.0, 2.0, 4.0, 8.0, 14.0, 21.0, 13.0, 31.0, 55.0, 63.0, 109.0, 120.0, 150.0, 253.0, 382.0, 455.0, 644.0, 854.0, 1324.0, 1746.0, 2452.0, 3451.0, 5080.0, 7461.0, 10768.0, 16349.0, 26865.0, 48420.0, 141316.0, 5745100.0, 149459.0, 49473.0, 26939.0, 16649.0, 10720.0, 7543.0, 5030.0, 3426.0, 2367.0, 1833.0, 1219.0, 862.0, 687.0, 499.0, 322.0, 244.0, 184.0, 137.0, 81.0, 70.0, 42.0, 36.0, 54.0, 23.0, 10.0, 5.0, 3.0, 5.0, 7.0, 4.0], "bins": [-3.71875, -3.6077880859375, -3.496826171875, -3.3858642578125, -3.27490234375, -3.1639404296875, -3.052978515625, -2.9420166015625, -2.8310546875, -2.7200927734375, -2.609130859375, -2.4981689453125, -2.38720703125, -2.2762451171875, -2.165283203125, -2.0543212890625, -1.943359375, -1.8323974609375, -1.721435546875, -1.6104736328125, -1.49951171875, -1.3885498046875, -1.277587890625, -1.1666259765625, -1.0556640625, -0.9447021484375, -0.833740234375, -0.7227783203125, -0.61181640625, -0.5008544921875, -0.389892578125, -0.2789306640625, -0.16796875, -0.0570068359375, 0.053955078125, 0.1649169921875, 0.27587890625, 0.3868408203125, 0.497802734375, 0.6087646484375, 0.7197265625, 0.8306884765625, 0.941650390625, 1.0526123046875, 1.16357421875, 1.2745361328125, 1.385498046875, 1.4964599609375, 1.607421875, 1.7183837890625, 1.829345703125, 1.9403076171875, 2.05126953125, 2.1622314453125, 2.273193359375, 2.3841552734375, 2.4951171875, 2.6060791015625, 2.717041015625, 2.8280029296875, 2.93896484375, 3.0499267578125, 3.160888671875, 3.2718505859375, 3.3828125]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 10.0, 6.0, 11.0, 13.0, 12.0, 13.0, 13.0, 11.0, 25.0, 21.0, 31.0, 35.0, 33.0, 22.0, 35.0, 39.0, 48.0, 46.0, 44.0, 1069.0, 41.0, 38.0, 46.0, 34.0, 37.0, 31.0, 35.0, 33.0, 34.0, 20.0, 21.0, 17.0, 13.0, 15.0, 8.0, 15.0, 8.0, 10.0, 6.0, 2.0, 4.0, 4.0, 3.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0], "bins": [-194.25, -188.568359375, -182.88671875, -177.205078125, -171.5234375, -165.841796875, -160.16015625, -154.478515625, -148.796875, -143.115234375, -137.43359375, -131.751953125, -126.0703125, -120.388671875, -114.70703125, -109.025390625, -103.34375, -97.662109375, -91.98046875, -86.298828125, -80.6171875, -74.935546875, -69.25390625, -63.572265625, -57.890625, -52.208984375, -46.52734375, -40.845703125, -35.1640625, -29.482421875, -23.80078125, -18.119140625, -12.4375, -6.755859375, -1.07421875, 4.607421875, 10.2890625, 15.970703125, 21.65234375, 27.333984375, 33.015625, 38.697265625, 44.37890625, 50.060546875, 55.7421875, 61.423828125, 67.10546875, 72.787109375, 78.46875, 84.150390625, 89.83203125, 95.513671875, 101.1953125, 106.876953125, 112.55859375, 118.240234375, 123.921875, 129.603515625, 135.28515625, 140.966796875, 146.6484375, 152.330078125, 158.01171875, 163.693359375, 169.375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 7.0, 12.0, 8.0, 17.0, 30.0, 50.0, 94.0, 503.0, 135.0, 42.0, 34.0, 19.0, 11.0, 8.0, 6.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-111.89189147949219, -105.8975601196289, -99.9032211303711, -93.90888977050781, -87.91455078125, -81.92021942138672, -75.92588806152344, -69.93154907226562, -63.937217712402344, -57.9428825378418, -51.94854736328125, -45.95421600341797, -39.95988082885742, -33.965545654296875, -27.971214294433594, -21.976879119873047, -15.9825439453125, -9.98820972442627, -3.993875503540039, 2.000457763671875, 7.994792938232422, 13.989128112792969, 19.98345947265625, 25.977794647216797, 31.972129821777344, 37.96646499633789, 43.96080017089844, 49.95513153076172, 55.949466705322266, 61.94380187988281, 67.9381332397461, 73.93246459960938, 79.92678833007812, 85.9211196899414, 91.91545867919922, 97.9097900390625, 103.90412902832031, 109.8984603881836, 115.89279174804688, 121.88713073730469, 127.88146209716797, 133.87579345703125, 139.87013244628906, 145.86447143554688, 151.85879516601562, 157.85313415527344, 163.84747314453125, 169.841796875, 175.8361358642578, 181.83047485351562, 187.82479858398438, 193.8191375732422, 199.8134765625, 205.80780029296875, 211.80213928222656, 217.79647827148438, 223.79080200195312, 229.78514099121094, 235.7794647216797, 241.7738037109375, 247.7681427001953, 253.76248168945312, 259.7568054199219, 265.7511291503906, 271.7454833984375]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 4.0, 4.0, 13.0, 50.0, 308.0, 463.0, 122.0, 18.0, 8.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1459.41357421875, -1422.2220458984375, -1385.030517578125, -1347.8388671875, -1310.6473388671875, -1273.455810546875, -1236.2642822265625, -1199.07275390625, -1161.881103515625, -1124.6895751953125, -1087.498046875, -1050.306396484375, -1013.1148681640625, -975.92333984375, -938.7318115234375, -901.5402221679688, -864.3486938476562, -827.1571655273438, -789.965576171875, -752.7740478515625, -715.5824584960938, -678.3909301757812, -641.1993408203125, -604.0078125, -566.8162841796875, -529.624755859375, -492.43316650390625, -455.24163818359375, -418.050048828125, -380.8585205078125, -343.6669616699219, -306.47540283203125, -269.28375244140625, -232.09219360351562, -194.900634765625, -157.70909118652344, -120.51753234863281, -83.32597351074219, -46.134429931640625, -8.94287109375, 28.248687744140625, 65.44024658203125, 102.63179779052734, 139.82334899902344, 177.01490783691406, 214.2064666748047, 251.39801025390625, 288.5895690917969, 325.7811279296875, 362.9726867675781, 400.16424560546875, 437.35577392578125, 474.54736328125, 511.7388916015625, 548.930419921875, 586.1220092773438, 623.3135986328125, 660.505126953125, 697.6967163085938, 734.8882446289062, 772.079833984375, 809.2713623046875, 846.462890625, 883.6544799804688, 920.8460083007812]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 3.0, 3.0, 4.0, 6.0, 3.0, 8.0, 3.0, 7.0, 7.0, 6.0, 15.0, 7.0, 6.0, 21.0, 12.0, 14.0, 9.0, 16.0, 17.0, 15.0, 18.0, 9.0, 19.0, 19.0, 23.0, 28.0, 39.0, 46.0, 47.0, 66.0, 64.0, 76.0, 84.0, 89.0, 156.0, 257.0, 379.0, 647.0, 1059.0, 1865.0, 2874.0, 8490.0, 4126628.0, 34373.0, 7266.0, 4409.0, 2054.0, 1028.0, 562.0, 374.0, 263.0, 194.0, 159.0, 137.0, 94.0, 63.0, 56.0, 40.0, 24.0, 14.0, 9.0, 10.0, 7.0], "bins": [-11.703125, -11.43695068359375, -11.1707763671875, -10.90460205078125, -10.638427734375, -10.37225341796875, -10.1060791015625, -9.83990478515625, -9.57373046875, -9.30755615234375, -9.0413818359375, -8.77520751953125, -8.509033203125, -8.24285888671875, -7.9766845703125, -7.71051025390625, -7.4443359375, -7.17816162109375, -6.9119873046875, -6.64581298828125, -6.379638671875, -6.11346435546875, -5.8472900390625, -5.58111572265625, -5.31494140625, -5.04876708984375, -4.7825927734375, -4.51641845703125, -4.250244140625, -3.98406982421875, -3.7178955078125, -3.45172119140625, -3.185546875, -2.91937255859375, -2.6531982421875, -2.38702392578125, -2.120849609375, -1.85467529296875, -1.5885009765625, -1.32232666015625, -1.05615234375, -0.78997802734375, -0.5238037109375, -0.25762939453125, 0.008544921875, 0.27471923828125, 0.5408935546875, 0.80706787109375, 1.0732421875, 1.33941650390625, 1.6055908203125, 1.87176513671875, 2.137939453125, 2.40411376953125, 2.6702880859375, 2.93646240234375, 3.20263671875, 3.46881103515625, 3.7349853515625, 4.00115966796875, 4.267333984375, 4.53350830078125, 4.7996826171875, 5.06585693359375, 5.33203125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 7.0, 3.0, 7.0, 22.0, 27.0, 463.0, 403.0, 22.0, 14.0, 16.0, 10.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.77880859375, -0.7610969543457031, -0.7433853149414062, -0.7256736755371094, -0.7079620361328125, -0.6902503967285156, -0.6725387573242188, -0.6548271179199219, -0.637115478515625, -0.6194038391113281, -0.6016921997070312, -0.5839805603027344, -0.5662689208984375, -0.5485572814941406, -0.5308456420898438, -0.5131340026855469, -0.49542236328125, -0.4777107238769531, -0.45999908447265625, -0.4422874450683594, -0.4245758056640625, -0.4068641662597656, -0.38915252685546875, -0.3714408874511719, -0.353729248046875, -0.3360176086425781, -0.31830596923828125, -0.3005943298339844, -0.2828826904296875, -0.2651710510253906, -0.24745941162109375, -0.22974777221679688, -0.2120361328125, -0.19432449340820312, -0.17661285400390625, -0.15890121459960938, -0.1411895751953125, -0.12347793579101562, -0.10576629638671875, -0.08805465698242188, -0.070343017578125, -0.052631378173828125, -0.03491973876953125, -0.017208099365234375, 0.0005035400390625, 0.018215179443359375, 0.03592681884765625, 0.053638458251953125, 0.07135009765625, 0.08906173706054688, 0.10677337646484375, 0.12448501586914062, 0.1421966552734375, 0.15990829467773438, 0.17761993408203125, 0.19533157348632812, 0.213043212890625, 0.23075485229492188, 0.24846649169921875, 0.2661781311035156, 0.2838897705078125, 0.3016014099121094, 0.31931304931640625, 0.3370246887207031, 0.354736328125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 2.0, 6.0, 6.0, 12.0, 15.0, 18.0, 24.0, 34.0, 45.0, 71.0, 102.0, 130.0, 197.0, 313.0, 458.0, 717.0, 1222.0, 1972.0, 3600.0, 6696.0, 14394.0, 49162.0, 4050491.0, 36487.0, 12906.0, 6212.0, 3552.0, 2036.0, 1260.0, 766.0, 511.0, 319.0, 190.0, 119.0, 87.0, 47.0, 29.0, 26.0, 13.0, 7.0, 8.0, 3.0, 7.0, 1.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.431640625, -1.386016845703125, -1.34039306640625, -1.294769287109375, -1.2491455078125, -1.203521728515625, -1.15789794921875, -1.112274169921875, -1.066650390625, -1.021026611328125, -0.97540283203125, -0.929779052734375, -0.8841552734375, -0.838531494140625, -0.79290771484375, -0.747283935546875, -0.70166015625, -0.656036376953125, -0.61041259765625, -0.564788818359375, -0.5191650390625, -0.473541259765625, -0.42791748046875, -0.382293701171875, -0.336669921875, -0.291046142578125, -0.24542236328125, -0.199798583984375, -0.1541748046875, -0.108551025390625, -0.06292724609375, -0.017303466796875, 0.0283203125, 0.073944091796875, 0.11956787109375, 0.165191650390625, 0.2108154296875, 0.256439208984375, 0.30206298828125, 0.347686767578125, 0.393310546875, 0.438934326171875, 0.48455810546875, 0.530181884765625, 0.5758056640625, 0.621429443359375, 0.66705322265625, 0.712677001953125, 0.75830078125, 0.803924560546875, 0.84954833984375, 0.895172119140625, 0.9407958984375, 0.986419677734375, 1.03204345703125, 1.077667236328125, 1.123291015625, 1.168914794921875, 1.21453857421875, 1.260162353515625, 1.3057861328125, 1.351409912109375, 1.39703369140625, 1.442657470703125, 1.48828125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 3.0, 8.0, 8.0, 10.0, 9.0, 14.0, 15.0, 22.0, 18.0, 144.0, 3635.0, 28.0, 21.0, 17.0, 22.0, 16.0, 15.0, 10.0, 11.0, 9.0, 9.0, 6.0, 6.0, 4.0, 2.0, 3.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65478515625, -0.6380386352539062, -0.6212921142578125, -0.6045455932617188, -0.587799072265625, -0.5710525512695312, -0.5543060302734375, -0.5375595092773438, -0.52081298828125, -0.5040664672851562, -0.4873199462890625, -0.47057342529296875, -0.453826904296875, -0.43708038330078125, -0.4203338623046875, -0.40358734130859375, -0.3868408203125, -0.37009429931640625, -0.3533477783203125, -0.33660125732421875, -0.319854736328125, -0.30310821533203125, -0.2863616943359375, -0.26961517333984375, -0.25286865234375, -0.23612213134765625, -0.2193756103515625, -0.20262908935546875, -0.185882568359375, -0.16913604736328125, -0.1523895263671875, -0.13564300537109375, -0.118896484375, -0.10214996337890625, -0.0854034423828125, -0.06865692138671875, -0.051910400390625, -0.03516387939453125, -0.0184173583984375, -0.00167083740234375, 0.01507568359375, 0.03182220458984375, 0.0485687255859375, 0.06531524658203125, 0.082061767578125, 0.09880828857421875, 0.1155548095703125, 0.13230133056640625, 0.1490478515625, 0.16579437255859375, 0.1825408935546875, 0.19928741455078125, 0.216033935546875, 0.23278045654296875, 0.2495269775390625, 0.26627349853515625, 0.28302001953125, 0.29976654052734375, 0.3165130615234375, 0.33325958251953125, 0.350006103515625, 0.36675262451171875, 0.3834991455078125, 0.40024566650390625, 0.4169921875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 14.0, 66.0, 782.0, 95.0, 19.0, 15.0, 7.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5481555461883545, -2.2760331630706787, -2.003910541534424, -1.731788158416748, -1.4596656560897827, -1.1875431537628174, -0.9154207706451416, -0.6432982683181763, -0.37117576599121094, -0.099053293466568, 0.17306917905807495, 0.4451916217803955, 0.7173141241073608, 0.9894366264343262, 1.261559009552002, 1.5336815118789673, 1.8058040142059326, 2.0779263973236084, 2.3500490188598633, 2.622171401977539, 2.894293785095215, 3.1664164066314697, 3.4385387897491455, 3.7106614112854004, 3.982783794403076, 4.254906177520752, 4.527028560638428, 4.799151420593262, 5.0712738037109375, 5.343396186828613, 5.615518569946289, 5.887640953063965, 6.159763336181641, 6.431885719299316, 6.704008102416992, 6.976130485534668, 7.248253345489502, 7.520375728607178, 7.7924981117248535, 8.064620971679688, 8.336743354797363, 8.608865737915039, 8.880988121032715, 9.15311050415039, 9.425232887268066, 9.697355270385742, 9.969478607177734, 10.24160099029541, 10.513723373413086, 10.785845756530762, 11.057968139648438, 11.330090522766113, 11.602212905883789, 11.874336242675781, 12.14645767211914, 12.418581008911133, 12.690702438354492, 12.962824821472168, 13.234947204589844, 13.50706958770752, 13.779191970825195, 14.051315307617188, 14.323436737060547, 14.595560073852539, 14.867682456970215]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 2.0, 5.0, 7.0, 22.0, 30.0, 45.0, 71.0, 97.0, 136.0, 141.0, 160.0, 116.0, 60.0, 47.0, 21.0, 13.0, 15.0, 7.0, 2.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.243732213973999, -3.1306803226470947, -3.0176284313201904, -2.904576539993286, -2.791524648666382, -2.6784727573394775, -2.5654208660125732, -2.452368974685669, -2.3393170833587646, -2.2262651920318604, -2.113213300704956, -2.0001614093780518, -1.8871095180511475, -1.7740576267242432, -1.6610057353973389, -1.5479538440704346, -1.4349019527435303, -1.321850061416626, -1.2087981700897217, -1.0957462787628174, -0.9826943874359131, -0.8696424961090088, -0.7565906047821045, -0.6435387134552002, -0.5304868221282959, -0.4174349308013916, -0.3043830394744873, -0.191331148147583, -0.07827925682067871, 0.034772634506225586, 0.14782452583312988, 0.2608764171600342, 0.3739280700683594, 0.48697996139526367, 0.600031852722168, 0.7130837440490723, 0.8261356353759766, 0.9391875267028809, 1.0522394180297852, 1.1652913093566895, 1.2783432006835938, 1.391395092010498, 1.5044469833374023, 1.6174988746643066, 1.730550765991211, 1.8436026573181152, 1.9566545486450195, 2.069706439971924, 2.182758331298828, 2.2958102226257324, 2.4088621139526367, 2.521914005279541, 2.6349658966064453, 2.7480177879333496, 2.861069679260254, 2.974121570587158, 3.0871734619140625, 3.200225353240967, 3.313277244567871, 3.4263291358947754, 3.5393810272216797, 3.652432918548584, 3.7654848098754883, 3.8785367012023926, 3.991588592529297]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 7.0, 10.0, 13.0, 6.0, 15.0, 12.0, 13.0, 24.0, 23.0, 35.0, 85.0, 99.0, 150.0, 211.0, 452.0, 896.0, 2239.0, 8225.0, 83593.0, 937778.0, 9856.0, 2598.0, 988.0, 457.0, 257.0, 165.0, 110.0, 59.0, 55.0, 30.0, 17.0, 21.0, 19.0, 10.0, 9.0, 6.0, 8.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.34765625, -5.203338623046875, -5.05902099609375, -4.914703369140625, -4.7703857421875, -4.626068115234375, -4.48175048828125, -4.337432861328125, -4.193115234375, -4.048797607421875, -3.90447998046875, -3.760162353515625, -3.6158447265625, -3.471527099609375, -3.32720947265625, -3.182891845703125, -3.03857421875, -2.894256591796875, -2.74993896484375, -2.605621337890625, -2.4613037109375, -2.316986083984375, -2.17266845703125, -2.028350830078125, -1.884033203125, -1.739715576171875, -1.59539794921875, -1.451080322265625, -1.3067626953125, -1.162445068359375, -1.01812744140625, -0.873809814453125, -0.7294921875, -0.585174560546875, -0.44085693359375, -0.296539306640625, -0.1522216796875, -0.007904052734375, 0.13641357421875, 0.280731201171875, 0.425048828125, 0.569366455078125, 0.71368408203125, 0.858001708984375, 1.0023193359375, 1.146636962890625, 1.29095458984375, 1.435272216796875, 1.57958984375, 1.723907470703125, 1.86822509765625, 2.012542724609375, 2.1568603515625, 2.301177978515625, 2.44549560546875, 2.589813232421875, 2.734130859375, 2.878448486328125, 3.02276611328125, 3.167083740234375, 3.3114013671875, 3.455718994140625, 3.60003662109375, 3.744354248046875, 3.888671875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 9.0, 1.0, 10.0, 22.0, 30.0, 819.0, 44.0, 20.0, 17.0, 13.0, 9.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77197265625, -0.7543525695800781, -0.7367324829101562, -0.7191123962402344, -0.7014923095703125, -0.6838722229003906, -0.6662521362304688, -0.6486320495605469, -0.631011962890625, -0.6133918762207031, -0.5957717895507812, -0.5781517028808594, -0.5605316162109375, -0.5429115295410156, -0.5252914428710938, -0.5076713562011719, -0.49005126953125, -0.4724311828613281, -0.45481109619140625, -0.4371910095214844, -0.4195709228515625, -0.4019508361816406, -0.38433074951171875, -0.3667106628417969, -0.349090576171875, -0.3314704895019531, -0.31385040283203125, -0.2962303161621094, -0.2786102294921875, -0.2609901428222656, -0.24337005615234375, -0.22574996948242188, -0.2081298828125, -0.19050979614257812, -0.17288970947265625, -0.15526962280273438, -0.1376495361328125, -0.12002944946289062, -0.10240936279296875, -0.08478927612304688, -0.067169189453125, -0.049549102783203125, -0.03192901611328125, -0.014308929443359375, 0.0033111572265625, 0.020931243896484375, 0.03855133056640625, 0.056171417236328125, 0.07379150390625, 0.09141159057617188, 0.10903167724609375, 0.12665176391601562, 0.1442718505859375, 0.16189193725585938, 0.17951202392578125, 0.19713211059570312, 0.214752197265625, 0.23237228393554688, 0.24999237060546875, 0.2676124572753906, 0.2852325439453125, 0.3028526306152344, 0.32047271728515625, 0.3380928039550781, 0.355712890625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 3.0, 4.0, 1.0, 1.0, 7.0, 2.0, 9.0, 21.0, 16.0, 27.0, 41.0, 44.0, 73.0, 102.0, 123.0, 182.0, 274.0, 417.0, 630.0, 921.0, 1374.0, 2149.0, 3589.0, 5943.0, 9665.0, 16955.0, 32085.0, 71849.0, 355580.0, 397627.0, 73494.0, 32439.0, 16800.0, 9871.0, 5989.0, 3587.0, 2274.0, 1506.0, 945.0, 635.0, 373.0, 279.0, 214.0, 133.0, 103.0, 68.0, 40.0, 17.0, 18.0, 26.0, 9.0, 8.0, 10.0, 4.0, 4.0, 5.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.59814453125, -0.5800247192382812, -0.5619049072265625, -0.5437850952148438, -0.525665283203125, -0.5075454711914062, -0.4894256591796875, -0.47130584716796875, -0.45318603515625, -0.43506622314453125, -0.4169464111328125, -0.39882659912109375, -0.380706787109375, -0.36258697509765625, -0.3444671630859375, -0.32634735107421875, -0.3082275390625, -0.29010772705078125, -0.2719879150390625, -0.25386810302734375, -0.235748291015625, -0.21762847900390625, -0.1995086669921875, -0.18138885498046875, -0.16326904296875, -0.14514923095703125, -0.1270294189453125, -0.10890960693359375, -0.090789794921875, -0.07266998291015625, -0.0545501708984375, -0.03643035888671875, -0.018310546875, -0.00019073486328125, 0.0179290771484375, 0.03604888916015625, 0.054168701171875, 0.07228851318359375, 0.0904083251953125, 0.10852813720703125, 0.12664794921875, 0.14476776123046875, 0.1628875732421875, 0.18100738525390625, 0.199127197265625, 0.21724700927734375, 0.2353668212890625, 0.25348663330078125, 0.2716064453125, 0.28972625732421875, 0.3078460693359375, 0.32596588134765625, 0.344085693359375, 0.36220550537109375, 0.3803253173828125, 0.39844512939453125, 0.41656494140625, 0.43468475341796875, 0.4528045654296875, 0.47092437744140625, 0.489044189453125, 0.5071640014648438, 0.5252838134765625, 0.5434036254882812, 0.5615234375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 12.0, 12.0, 17.0, 19.0, 15.0, 18.0, 26.0, 23.0, 36.0, 37.0, 38.0, 30.0, 34.0, 38.0, 36.0, 33.0, 53.0, 43.0, 51.0, 42.0, 53.0, 32.0, 37.0, 40.0, 35.0, 19.0, 25.0, 21.0, 20.0, 20.0, 17.0, 11.0, 14.0, 7.0, 7.0, 7.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.63134765625, -0.6109695434570312, -0.5905914306640625, -0.5702133178710938, -0.549835205078125, -0.5294570922851562, -0.5090789794921875, -0.48870086669921875, -0.46832275390625, -0.44794464111328125, -0.4275665283203125, -0.40718841552734375, -0.386810302734375, -0.36643218994140625, -0.3460540771484375, -0.32567596435546875, -0.3052978515625, -0.28491973876953125, -0.2645416259765625, -0.24416351318359375, -0.223785400390625, -0.20340728759765625, -0.1830291748046875, -0.16265106201171875, -0.14227294921875, -0.12189483642578125, -0.1015167236328125, -0.08113861083984375, -0.060760498046875, -0.04038238525390625, -0.0200042724609375, 0.00037384033203125, 0.020751953125, 0.04113006591796875, 0.0615081787109375, 0.08188629150390625, 0.102264404296875, 0.12264251708984375, 0.1430206298828125, 0.16339874267578125, 0.18377685546875, 0.20415496826171875, 0.2245330810546875, 0.24491119384765625, 0.265289306640625, 0.28566741943359375, 0.3060455322265625, 0.32642364501953125, 0.3468017578125, 0.36717987060546875, 0.3875579833984375, 0.40793609619140625, 0.428314208984375, 0.44869232177734375, 0.4690704345703125, 0.48944854736328125, 0.50982666015625, 0.5302047729492188, 0.5505828857421875, 0.5709609985351562, 0.591339111328125, 0.6117172241210938, 0.6320953369140625, 0.6524734497070312, 0.6728515625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 5.0, 6.0, 9.0, 20.0, 52.0, 131.0, 489.0, 4846.0, 1032920.0, 9245.0, 548.0, 151.0, 69.0, 25.0, 17.0, 7.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.059326171875, -0.05799531936645508, -0.056664466857910156, -0.055333614349365234, -0.05400276184082031, -0.05267190933227539, -0.05134105682373047, -0.05001020431518555, -0.048679351806640625, -0.0473484992980957, -0.04601764678955078, -0.04468679428100586, -0.04335594177246094, -0.042025089263916016, -0.040694236755371094, -0.03936338424682617, -0.03803253173828125, -0.03670167922973633, -0.035370826721191406, -0.034039974212646484, -0.03270912170410156, -0.03137826919555664, -0.03004741668701172, -0.028716564178466797, -0.027385711669921875, -0.026054859161376953, -0.02472400665283203, -0.02339315414428711, -0.022062301635742188, -0.020731449127197266, -0.019400596618652344, -0.018069744110107422, -0.0167388916015625, -0.015408039093017578, -0.014077186584472656, -0.012746334075927734, -0.011415481567382812, -0.01008462905883789, -0.008753776550292969, -0.007422924041748047, -0.006092071533203125, -0.004761219024658203, -0.0034303665161132812, -0.0020995140075683594, -0.0007686614990234375, 0.0005621910095214844, 0.0018930435180664062, 0.003223896026611328, 0.00455474853515625, 0.005885601043701172, 0.007216453552246094, 0.008547306060791016, 0.009878158569335938, 0.01120901107788086, 0.012539863586425781, 0.013870716094970703, 0.015201568603515625, 0.016532421112060547, 0.01786327362060547, 0.01919412612915039, 0.020524978637695312, 0.021855831146240234, 0.023186683654785156, 0.024517536163330078, 0.025848388671875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 7.0, 8.0, 15.0, 16.0, 28.0, 31.0, 65.0, 88.0, 117.0, 126.0, 103.0, 117.0, 78.0, 73.0, 40.0, 34.0, 17.0, 14.0, 5.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.556510925292969e-06, -6.350688636302948e-06, -6.144866347312927e-06, -5.9390440583229065e-06, -5.733221769332886e-06, -5.527399480342865e-06, -5.321577191352844e-06, -5.1157549023628235e-06, -4.909932613372803e-06, -4.704110324382782e-06, -4.498288035392761e-06, -4.2924657464027405e-06, -4.08664345741272e-06, -3.880821168422699e-06, -3.6749988794326782e-06, -3.4691765904426575e-06, -3.2633543014526367e-06, -3.057532012462616e-06, -2.8517097234725952e-06, -2.6458874344825745e-06, -2.4400651454925537e-06, -2.234242856502533e-06, -2.028420567512512e-06, -1.8225982785224915e-06, -1.6167759895324707e-06, -1.41095370054245e-06, -1.2051314115524292e-06, -9.993091225624084e-07, -7.934868335723877e-07, -5.876645445823669e-07, -3.818422555923462e-07, -1.7601996660232544e-07, 2.9802322387695312e-08, 2.3562461137771606e-07, 4.414469003677368e-07, 6.472691893577576e-07, 8.530914783477783e-07, 1.058913767337799e-06, 1.2647360563278198e-06, 1.4705583453178406e-06, 1.6763806343078613e-06, 1.882202923297882e-06, 2.088025212287903e-06, 2.2938475012779236e-06, 2.4996697902679443e-06, 2.705492079257965e-06, 2.911314368247986e-06, 3.1171366572380066e-06, 3.3229589462280273e-06, 3.528781235218048e-06, 3.734603524208069e-06, 3.94042581319809e-06, 4.14624810218811e-06, 4.352070391178131e-06, 4.557892680168152e-06, 4.763714969158173e-06, 4.969537258148193e-06, 5.175359547138214e-06, 5.381181836128235e-06, 5.587004125118256e-06, 5.792826414108276e-06, 5.998648703098297e-06, 6.204470992088318e-06, 6.410293281078339e-06, 6.616115570068359e-06]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 6.0, 5.0, 8.0, 14.0, 11.0, 15.0, 18.0, 17.0, 28.0, 74.0, 117.0, 230.0, 530.0, 1195.0, 3029.0, 10624.0, 76234.0, 911645.0, 33979.0, 6932.0, 2109.0, 876.0, 378.0, 199.0, 97.0, 61.0, 24.0, 22.0, 17.0, 10.0, 12.0, 8.0, 3.0, 4.0, 2.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.006771087646484375, -0.006514012813568115, -0.0062569379806518555, -0.005999863147735596, -0.005742788314819336, -0.005485713481903076, -0.005228638648986816, -0.004971563816070557, -0.004714488983154297, -0.004457414150238037, -0.004200339317321777, -0.003943264484405518, -0.003686189651489258, -0.003429114818572998, -0.0031720399856567383, -0.0029149651527404785, -0.0026578903198242188, -0.002400815486907959, -0.0021437406539916992, -0.0018866658210754395, -0.0016295909881591797, -0.00137251615524292, -0.0011154413223266602, -0.0008583664894104004, -0.0006012916564941406, -0.00034421682357788086, -8.71419906616211e-05, 0.00016993284225463867, 0.00042700767517089844, 0.0006840825080871582, 0.000941157341003418, 0.0011982321739196777, 0.0014553070068359375, 0.0017123818397521973, 0.001969456672668457, 0.002226531505584717, 0.0024836063385009766, 0.0027406811714172363, 0.002997756004333496, 0.003254830837249756, 0.0035119056701660156, 0.0037689805030822754, 0.004026055335998535, 0.004283130168914795, 0.004540205001831055, 0.0047972798347473145, 0.005054354667663574, 0.005311429500579834, 0.005568504333496094, 0.0058255791664123535, 0.006082653999328613, 0.006339728832244873, 0.006596803665161133, 0.006853878498077393, 0.007110953330993652, 0.007368028163909912, 0.007625102996826172, 0.007882177829742432, 0.008139252662658691, 0.008396327495574951, 0.008653402328491211, 0.00891047716140747, 0.00916755199432373, 0.00942462682723999, 0.00968170166015625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 1.0, 2.0, 7.0, 12.0, 8.0, 13.0, 25.0, 36.0, 61.0, 111.0, 208.0, 233.0, 117.0, 63.0, 32.0, 24.0, 21.0, 15.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0107574462890625, -0.010528534650802612, -0.010299623012542725, -0.010070711374282837, -0.00984179973602295, -0.009612888097763062, -0.009383976459503174, -0.009155064821243286, -0.008926153182983398, -0.00869724154472351, -0.008468329906463623, -0.008239418268203735, -0.008010506629943848, -0.00778159499168396, -0.007552683353424072, -0.007323771715164185, -0.007094860076904297, -0.006865948438644409, -0.0066370368003845215, -0.006408125162124634, -0.006179213523864746, -0.005950301885604858, -0.005721390247344971, -0.005492478609085083, -0.005263566970825195, -0.005034655332565308, -0.00480574369430542, -0.004576832056045532, -0.0043479204177856445, -0.004119008779525757, -0.003890097141265869, -0.0036611855030059814, -0.0034322738647460938, -0.003203362226486206, -0.0029744505882263184, -0.0027455389499664307, -0.002516627311706543, -0.0022877156734466553, -0.0020588040351867676, -0.0018298923969268799, -0.0016009807586669922, -0.0013720691204071045, -0.0011431574821472168, -0.0009142458438873291, -0.0006853342056274414, -0.0004564225673675537, -0.00022751092910766602, 1.4007091522216797e-06, 0.00023031234741210938, 0.00045922398567199707, 0.0006881356239318848, 0.0009170472621917725, 0.0011459589004516602, 0.0013748705387115479, 0.0016037821769714355, 0.0018326938152313232, 0.002061605453491211, 0.0022905170917510986, 0.0025194287300109863, 0.002748340368270874, 0.0029772520065307617, 0.0032061636447906494, 0.003435075283050537, 0.003663986921310425, 0.0038928985595703125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 14.0, 17.0, 58.0, 483.0, 295.0, 81.0, 31.0, 17.0, 9.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.689971923828125, -22.160972595214844, -21.631973266601562, -21.10297203063965, -20.573972702026367, -20.044973373413086, -19.515974044799805, -18.986974716186523, -18.45797348022461, -17.928974151611328, -17.399974822998047, -16.870973587036133, -16.34197425842285, -15.81297492980957, -15.283975601196289, -14.754976272583008, -14.225976943969727, -13.696977615356445, -13.167977333068848, -12.638978004455566, -12.109977722167969, -11.580978393554688, -11.051979064941406, -10.522979736328125, -9.993979454040527, -9.464980125427246, -8.935979843139648, -8.406980514526367, -7.877980709075928, -7.348980903625488, -6.819981575012207, -6.290981769561768, -5.761983871459961, -5.2329840660095215, -4.703984260559082, -4.174984931945801, -3.6459851264953613, -3.116985321044922, -2.5879857540130615, -2.058986186981201, -1.5299863815307617, -1.0009866952896118, -0.4719870090484619, 0.05701267719268799, 0.5860123634338379, 1.1150121688842773, 1.6440117359161377, 2.173011302947998, 2.7020111083984375, 3.231010913848877, 3.7600104808807373, 4.289010047912598, 4.818009853363037, 5.347009658813477, 5.876008987426758, 6.405008792877197, 6.934008598327637, 7.463008403778076, 7.992008209228516, 8.521007537841797, 9.050006866455078, 9.579007148742676, 10.108006477355957, 10.637006759643555, 11.166006088256836]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 6.0, 4.0, 5.0, 9.0, 16.0, 28.0, 37.0, 70.0, 99.0, 133.0, 177.0, 160.0, 107.0, 54.0, 38.0, 18.0, 11.0, 7.0, 7.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.262331008911133, -8.761574745178223, -8.260818481445312, -7.760062217712402, -7.259305953979492, -6.758549690246582, -6.25779390335083, -5.75703763961792, -5.25628137588501, -4.7555251121521, -4.2547688484191895, -3.7540128231048584, -3.2532565593719482, -2.752500295639038, -2.251744270324707, -1.7509880065917969, -1.2502317428588867, -0.7494755387306213, -0.24871933460235596, 0.25203680992126465, 0.7527930736541748, 1.253549337387085, 1.754305362701416, 2.255061626434326, 2.7558178901672363, 3.2565741539001465, 3.7573304176330566, 4.258086204528809, 4.758842468261719, 5.259598731994629, 5.760354995727539, 6.261111259460449, 6.761867523193359, 7.2626237869262695, 7.76338005065918, 8.26413631439209, 8.764892578125, 9.26564884185791, 9.76640510559082, 10.267160415649414, 10.76791763305664, 11.26867389678955, 11.769430160522461, 12.270186424255371, 12.770942687988281, 13.271698951721191, 13.772455215454102, 14.273210525512695, 14.773966789245605, 15.274723052978516, 15.775479316711426, 16.276235580444336, 16.77699089050293, 17.277748107910156, 17.77850341796875, 18.279260635375977, 18.78001594543457, 19.280771255493164, 19.78152847290039, 20.282283782958984, 20.78304100036621, 21.283796310424805, 21.78455352783203, 22.285308837890625, 22.78606605529785]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 4.0, 6.0, 11.0, 8.0, 23.0, 44.0, 54.0, 103.0, 163.0, 350.0, 999.0, 11295.0, 4176424.0, 3838.0, 674.0, 180.0, 58.0, 27.0, 10.0, 3.0, 9.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.9375, -78.09130859375, -76.2451171875, -74.39892578125, -72.552734375, -70.70654296875, -68.8603515625, -67.01416015625, -65.16796875, -63.32177734375, -61.4755859375, -59.62939453125, -57.783203125, -55.93701171875, -54.0908203125, -52.24462890625, -50.3984375, -48.55224609375, -46.7060546875, -44.85986328125, -43.013671875, -41.16748046875, -39.3212890625, -37.47509765625, -35.62890625, -33.78271484375, -31.9365234375, -30.09033203125, -28.244140625, -26.39794921875, -24.5517578125, -22.70556640625, -20.859375, -19.01318359375, -17.1669921875, -15.32080078125, -13.474609375, -11.62841796875, -9.7822265625, -7.93603515625, -6.08984375, -4.24365234375, -2.3974609375, -0.55126953125, 1.294921875, 3.14111328125, 4.9873046875, 6.83349609375, 8.6796875, 10.52587890625, 12.3720703125, 14.21826171875, 16.064453125, 17.91064453125, 19.7568359375, 21.60302734375, 23.44921875, 25.29541015625, 27.1416015625, 28.98779296875, 30.833984375, 32.68017578125, 34.5263671875, 36.37255859375, 38.21875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 4.0, 9.0, 11.0, 25.0, 49.0, 821.0, 26.0, 20.0, 16.0, 7.0, 6.0, 3.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.74951171875, -0.7322006225585938, -0.7148895263671875, -0.6975784301757812, -0.680267333984375, -0.6629562377929688, -0.6456451416015625, -0.6283340454101562, -0.61102294921875, -0.5937118530273438, -0.5764007568359375, -0.5590896606445312, -0.541778564453125, -0.5244674682617188, -0.5071563720703125, -0.48984527587890625, -0.4725341796875, -0.45522308349609375, -0.4379119873046875, -0.42060089111328125, -0.403289794921875, -0.38597869873046875, -0.3686676025390625, -0.35135650634765625, -0.33404541015625, -0.31673431396484375, -0.2994232177734375, -0.28211212158203125, -0.264801025390625, -0.24748992919921875, -0.2301788330078125, -0.21286773681640625, -0.195556640625, -0.17824554443359375, -0.1609344482421875, -0.14362335205078125, -0.126312255859375, -0.10900115966796875, -0.0916900634765625, -0.07437896728515625, -0.05706787109375, -0.03975677490234375, -0.0224456787109375, -0.00513458251953125, 0.012176513671875, 0.02948760986328125, 0.0467987060546875, 0.06410980224609375, 0.0814208984375, 0.09873199462890625, 0.1160430908203125, 0.13335418701171875, 0.150665283203125, 0.16797637939453125, 0.1852874755859375, 0.20259857177734375, 0.21990966796875, 0.23722076416015625, 0.2545318603515625, 0.27184295654296875, 0.289154052734375, 0.30646514892578125, 0.3237762451171875, 0.34108734130859375, 0.3583984375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 5.0, 4.0, 5.0, 6.0, 17.0, 10.0, 23.0, 36.0, 37.0, 69.0, 88.0, 150.0, 310.0, 554.0, 1021.0, 2145.0, 4729.0, 11657.0, 36460.0, 3933214.0, 159742.0, 27129.0, 9175.0, 3925.0, 1732.0, 900.0, 478.0, 252.0, 138.0, 84.0, 49.0, 39.0, 31.0, 17.0, 15.0, 15.0, 14.0, 6.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.103515625, -2.01904296875, -1.9345703125, -1.85009765625, -1.765625, -1.68115234375, -1.5966796875, -1.51220703125, -1.427734375, -1.34326171875, -1.2587890625, -1.17431640625, -1.08984375, -1.00537109375, -0.9208984375, -0.83642578125, -0.751953125, -0.66748046875, -0.5830078125, -0.49853515625, -0.4140625, -0.32958984375, -0.2451171875, -0.16064453125, -0.076171875, 0.00830078125, 0.0927734375, 0.17724609375, 0.26171875, 0.34619140625, 0.4306640625, 0.51513671875, 0.599609375, 0.68408203125, 0.7685546875, 0.85302734375, 0.9375, 1.02197265625, 1.1064453125, 1.19091796875, 1.275390625, 1.35986328125, 1.4443359375, 1.52880859375, 1.61328125, 1.69775390625, 1.7822265625, 1.86669921875, 1.951171875, 2.03564453125, 2.1201171875, 2.20458984375, 2.2890625, 2.37353515625, 2.4580078125, 2.54248046875, 2.626953125, 2.71142578125, 2.7958984375, 2.88037109375, 2.96484375, 3.04931640625, 3.1337890625, 3.21826171875, 3.302734375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 7.0, 3.0, 2.0, 5.0, 5.0, 3.0, 9.0, 14.0, 12.0, 12.0, 19.0, 21.0, 20.0, 26.0, 35.0, 27.0, 32.0, 3558.0, 68.0, 36.0, 30.0, 22.0, 17.0, 17.0, 12.0, 15.0, 9.0, 12.0, 7.0, 7.0, 8.0, 4.0, 0.0, 7.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.438720703125, -0.4274101257324219, -0.41609954833984375, -0.4047889709472656, -0.3934783935546875, -0.3821678161621094, -0.37085723876953125, -0.3595466613769531, -0.348236083984375, -0.3369255065917969, -0.32561492919921875, -0.3143043518066406, -0.3029937744140625, -0.2916831970214844, -0.28037261962890625, -0.2690620422363281, -0.25775146484375, -0.24644088745117188, -0.23513031005859375, -0.22381973266601562, -0.2125091552734375, -0.20119857788085938, -0.18988800048828125, -0.17857742309570312, -0.167266845703125, -0.15595626831054688, -0.14464569091796875, -0.13333511352539062, -0.1220245361328125, -0.11071395874023438, -0.09940338134765625, -0.08809280395507812, -0.0767822265625, -0.06547164916992188, -0.05416107177734375, -0.042850494384765625, -0.0315399169921875, -0.020229339599609375, -0.00891876220703125, 0.002391815185546875, 0.013702392578125, 0.025012969970703125, 0.03632354736328125, 0.047634124755859375, 0.0589447021484375, 0.07025527954101562, 0.08156585693359375, 0.09287643432617188, 0.10418701171875, 0.11549758911132812, 0.12680816650390625, 0.13811874389648438, 0.1494293212890625, 0.16073989868164062, 0.17205047607421875, 0.18336105346679688, 0.194671630859375, 0.20598220825195312, 0.21729278564453125, 0.22860336303710938, 0.2399139404296875, 0.2512245178222656, 0.26253509521484375, 0.2738456726074219, 0.28515625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 957.0, 42.0, 8.0, 2.0, 0.0, 1.0], "bins": [-30.43301010131836, -29.91424560546875, -29.39548110961914, -28.87671661376953, -28.357952117919922, -27.839187622070312, -27.320423126220703, -26.801658630371094, -26.282894134521484, -25.764129638671875, -25.245365142822266, -24.726600646972656, -24.207836151123047, -23.689071655273438, -23.170307159423828, -22.65154266357422, -22.132776260375977, -21.614011764526367, -21.095247268676758, -20.57648277282715, -20.05771827697754, -19.53895378112793, -19.02018928527832, -18.501422882080078, -17.98265838623047, -17.46389389038086, -16.94512939453125, -16.42636489868164, -15.907600402832031, -15.388835906982422, -14.870070457458496, -14.351305961608887, -13.832544326782227, -13.313779830932617, -12.795015335083008, -12.276250839233398, -11.757486343383789, -11.23872184753418, -10.719956398010254, -10.201191902160645, -9.682427406311035, -9.163662910461426, -8.644898414611816, -8.126133918762207, -7.6073689460754395, -7.08860445022583, -6.5698394775390625, -6.051074981689453, -5.532310485839844, -5.013545989990234, -4.494781494140625, -3.9760165214538574, -3.457252025604248, -2.9384875297546387, -2.41972279548645, -1.9009580612182617, -1.3821935653686523, -0.8634289503097534, -0.3446643352508545, 0.17410027980804443, 0.6928648948669434, 1.2116293907165527, 1.7303941249847412, 2.2491588592529297, 2.767923355102539]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 6.0, 6.0, 14.0, 18.0, 32.0, 45.0, 67.0, 124.0, 130.0, 135.0, 126.0, 95.0, 72.0, 48.0, 33.0, 14.0, 13.0, 3.0, 5.0, 8.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4376091957092285, -1.3694449663162231, -1.3012807369232178, -1.233116626739502, -1.1649523973464966, -1.0967881679534912, -1.0286240577697754, -0.96045982837677, -0.8922955989837646, -0.8241313695907593, -0.7559671998023987, -0.6878030300140381, -0.6196388006210327, -0.5514745712280273, -0.48331040143966675, -0.41514620184898376, -0.3469820022583008, -0.2788178026676178, -0.21065360307693481, -0.14248940348625183, -0.07432520389556885, -0.006161004304885864, 0.06200319528579712, 0.1301673948764801, 0.19833159446716309, 0.26649579405784607, 0.33465999364852905, 0.40282419323921204, 0.470988392829895, 0.5391526222229004, 0.607316792011261, 0.6754809617996216, 0.743645191192627, 0.8118094205856323, 0.8799735903739929, 0.9481377601623535, 1.0163019895553589, 1.0844662189483643, 1.15263032913208, 1.2207945585250854, 1.2889587879180908, 1.3571230173110962, 1.4252872467041016, 1.4934513568878174, 1.5616155862808228, 1.6297798156738281, 1.697943925857544, 1.7661081552505493, 1.8342723846435547, 1.90243661403656, 1.9706008434295654, 2.0387649536132812, 2.106929302215576, 2.175093412399292, 2.243257522583008, 2.3114218711853027, 2.3795859813690186, 2.4477500915527344, 2.5159144401550293, 2.584078550338745, 2.652242660522461, 2.720407009124756, 2.7885711193084717, 2.8567354679107666, 2.9248995780944824]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 8.0, 5.0, 7.0, 9.0, 11.0, 20.0, 27.0, 20.0, 23.0, 53.0, 67.0, 96.0, 164.0, 283.0, 461.0, 977.0, 2843.0, 13242.0, 995276.0, 27853.0, 4273.0, 1341.0, 582.0, 313.0, 193.0, 150.0, 62.0, 53.0, 38.0, 20.0, 24.0, 17.0, 12.0, 17.0, 5.0, 3.0, 9.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.0625, -4.9205322265625, -4.778564453125, -4.6365966796875, -4.49462890625, -4.3526611328125, -4.210693359375, -4.0687255859375, -3.9267578125, -3.7847900390625, -3.642822265625, -3.5008544921875, -3.35888671875, -3.2169189453125, -3.074951171875, -2.9329833984375, -2.791015625, -2.6490478515625, -2.507080078125, -2.3651123046875, -2.22314453125, -2.0811767578125, -1.939208984375, -1.7972412109375, -1.6552734375, -1.5133056640625, -1.371337890625, -1.2293701171875, -1.08740234375, -0.9454345703125, -0.803466796875, -0.6614990234375, -0.51953125, -0.3775634765625, -0.235595703125, -0.0936279296875, 0.04833984375, 0.1903076171875, 0.332275390625, 0.4742431640625, 0.6162109375, 0.7581787109375, 0.900146484375, 1.0421142578125, 1.18408203125, 1.3260498046875, 1.468017578125, 1.6099853515625, 1.751953125, 1.8939208984375, 2.035888671875, 2.1778564453125, 2.31982421875, 2.4617919921875, 2.603759765625, 2.7457275390625, 2.8876953125, 3.0296630859375, 3.171630859375, 3.3135986328125, 3.45556640625, 3.5975341796875, 3.739501953125, 3.8814697265625, 4.0234375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 8.0, 19.0, 35.0, 491.0, 382.0, 19.0, 17.0, 11.0, 7.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73486328125, -0.7177467346191406, -0.7006301879882812, -0.6835136413574219, -0.6663970947265625, -0.6492805480957031, -0.6321640014648438, -0.6150474548339844, -0.597930908203125, -0.5808143615722656, -0.5636978149414062, -0.5465812683105469, -0.5294647216796875, -0.5123481750488281, -0.49523162841796875, -0.4781150817871094, -0.46099853515625, -0.4438819885253906, -0.42676544189453125, -0.4096488952636719, -0.3925323486328125, -0.3754158020019531, -0.35829925537109375, -0.3411827087402344, -0.324066162109375, -0.3069496154785156, -0.28983306884765625, -0.2727165222167969, -0.2555999755859375, -0.23848342895507812, -0.22136688232421875, -0.20425033569335938, -0.1871337890625, -0.17001724243164062, -0.15290069580078125, -0.13578414916992188, -0.1186676025390625, -0.10155105590820312, -0.08443450927734375, -0.06731796264648438, -0.050201416015625, -0.033084869384765625, -0.01596832275390625, 0.001148223876953125, 0.0182647705078125, 0.035381317138671875, 0.05249786376953125, 0.06961441040039062, 0.08673095703125, 0.10384750366210938, 0.12096405029296875, 0.13808059692382812, 0.1551971435546875, 0.17231369018554688, 0.18943023681640625, 0.20654678344726562, 0.223663330078125, 0.24077987670898438, 0.25789642333984375, 0.2750129699707031, 0.2921295166015625, 0.3092460632324219, 0.32636260986328125, 0.3434791564941406, 0.360595703125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 6.0, 8.0, 3.0, 13.0, 14.0, 15.0, 30.0, 33.0, 44.0, 78.0, 114.0, 218.0, 433.0, 1162.0, 4514.0, 28276.0, 736721.0, 254946.0, 17060.0, 3081.0, 911.0, 370.0, 177.0, 103.0, 68.0, 39.0, 30.0, 26.0, 20.0, 11.0, 9.0, 6.0, 7.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6123046875, -1.5523223876953125, -1.492340087890625, -1.4323577880859375, -1.37237548828125, -1.3123931884765625, -1.252410888671875, -1.1924285888671875, -1.1324462890625, -1.0724639892578125, -1.012481689453125, -0.9524993896484375, -0.89251708984375, -0.8325347900390625, -0.772552490234375, -0.7125701904296875, -0.652587890625, -0.5926055908203125, -0.532623291015625, -0.4726409912109375, -0.41265869140625, -0.3526763916015625, -0.292694091796875, -0.2327117919921875, -0.1727294921875, -0.1127471923828125, -0.052764892578125, 0.0072174072265625, 0.06719970703125, 0.1271820068359375, 0.187164306640625, 0.2471466064453125, 0.30712890625, 0.3671112060546875, 0.427093505859375, 0.4870758056640625, 0.54705810546875, 0.6070404052734375, 0.667022705078125, 0.7270050048828125, 0.7869873046875, 0.8469696044921875, 0.906951904296875, 0.9669342041015625, 1.02691650390625, 1.0868988037109375, 1.146881103515625, 1.2068634033203125, 1.266845703125, 1.3268280029296875, 1.386810302734375, 1.4467926025390625, 1.50677490234375, 1.5667572021484375, 1.626739501953125, 1.6867218017578125, 1.7467041015625, 1.8066864013671875, 1.866668701171875, 1.9266510009765625, 1.98663330078125, 2.0466156005859375, 2.106597900390625, 2.1665802001953125, 2.2265625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 7.0, 7.0, 9.0, 10.0, 17.0, 22.0, 19.0, 27.0, 41.0, 43.0, 35.0, 51.0, 48.0, 59.0, 50.0, 50.0, 56.0, 65.0, 50.0, 48.0, 37.0, 41.0, 36.0, 37.0, 26.0, 29.0, 22.0, 15.0, 12.0, 13.0, 3.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.67626953125, -0.6580314636230469, -0.6397933959960938, -0.6215553283691406, -0.6033172607421875, -0.5850791931152344, -0.5668411254882812, -0.5486030578613281, -0.530364990234375, -0.5121269226074219, -0.49388885498046875, -0.4756507873535156, -0.4574127197265625, -0.4391746520996094, -0.42093658447265625, -0.4026985168457031, -0.38446044921875, -0.3662223815917969, -0.34798431396484375, -0.3297462463378906, -0.3115081787109375, -0.2932701110839844, -0.27503204345703125, -0.2567939758300781, -0.238555908203125, -0.22031784057617188, -0.20207977294921875, -0.18384170532226562, -0.1656036376953125, -0.14736557006835938, -0.12912750244140625, -0.11088943481445312, -0.0926513671875, -0.07441329956054688, -0.05617523193359375, -0.037937164306640625, -0.0196990966796875, -0.001461029052734375, 0.01677703857421875, 0.035015106201171875, 0.053253173828125, 0.07149124145507812, 0.08972930908203125, 0.10796737670898438, 0.1262054443359375, 0.14444351196289062, 0.16268157958984375, 0.18091964721679688, 0.19915771484375, 0.21739578247070312, 0.23563385009765625, 0.2538719177246094, 0.2721099853515625, 0.2903480529785156, 0.30858612060546875, 0.3268241882324219, 0.345062255859375, 0.3633003234863281, 0.38153839111328125, 0.3997764587402344, 0.4180145263671875, 0.4362525939941406, 0.45449066162109375, 0.4727287292480469, 0.490966796875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 7.0, 8.0, 12.0, 27.0, 32.0, 41.0, 85.0, 146.0, 336.0, 1108.0, 5489.0, 65537.0, 930444.0, 39715.0, 4029.0, 946.0, 281.0, 104.0, 79.0, 53.0, 20.0, 16.0, 20.0, 9.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09503173828125, -0.0924224853515625, -0.089813232421875, -0.0872039794921875, -0.0845947265625, -0.0819854736328125, -0.079376220703125, -0.0767669677734375, -0.07415771484375, -0.0715484619140625, -0.068939208984375, -0.0663299560546875, -0.063720703125, -0.0611114501953125, -0.058502197265625, -0.0558929443359375, -0.05328369140625, -0.0506744384765625, -0.048065185546875, -0.0454559326171875, -0.0428466796875, -0.0402374267578125, -0.037628173828125, -0.0350189208984375, -0.03240966796875, -0.0298004150390625, -0.027191162109375, -0.0245819091796875, -0.02197265625, -0.0193634033203125, -0.016754150390625, -0.0141448974609375, -0.01153564453125, -0.0089263916015625, -0.006317138671875, -0.0037078857421875, -0.0010986328125, 0.0015106201171875, 0.004119873046875, 0.0067291259765625, 0.00933837890625, 0.0119476318359375, 0.014556884765625, 0.0171661376953125, 0.019775390625, 0.0223846435546875, 0.024993896484375, 0.0276031494140625, 0.03021240234375, 0.0328216552734375, 0.035430908203125, 0.0380401611328125, 0.0406494140625, 0.0432586669921875, 0.045867919921875, 0.0484771728515625, 0.05108642578125, 0.0536956787109375, 0.056304931640625, 0.0589141845703125, 0.0615234375, 0.0641326904296875, 0.066741943359375, 0.0693511962890625, 0.07196044921875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 6.0, 0.0, 9.0, 8.0, 14.0, 23.0, 32.0, 26.0, 43.0, 76.0, 108.0, 82.0, 145.0, 113.0, 76.0, 73.0, 60.0, 37.0, 21.0, 14.0, 10.0, 10.0, 10.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.033348083496094e-06, -6.810761988162994e-06, -6.588175892829895e-06, -6.365589797496796e-06, -6.143003702163696e-06, -5.920417606830597e-06, -5.6978315114974976e-06, -5.475245416164398e-06, -5.252659320831299e-06, -5.0300732254981995e-06, -4.8074871301651e-06, -4.584901034832001e-06, -4.362314939498901e-06, -4.139728844165802e-06, -3.917142748832703e-06, -3.6945566534996033e-06, -3.471970558166504e-06, -3.2493844628334045e-06, -3.026798367500305e-06, -2.804212272167206e-06, -2.5816261768341064e-06, -2.359040081501007e-06, -2.1364539861679077e-06, -1.9138678908348083e-06, -1.691281795501709e-06, -1.4686957001686096e-06, -1.2461096048355103e-06, -1.0235235095024109e-06, -8.009374141693115e-07, -5.783513188362122e-07, -3.557652235031128e-07, -1.3317912817001343e-07, 8.940696716308594e-08, 3.119930624961853e-07, 5.345791578292847e-07, 7.57165253162384e-07, 9.797513484954834e-07, 1.2023374438285828e-06, 1.4249235391616821e-06, 1.6475096344947815e-06, 1.8700957298278809e-06, 2.0926818251609802e-06, 2.3152679204940796e-06, 2.537854015827179e-06, 2.7604401111602783e-06, 2.9830262064933777e-06, 3.205612301826477e-06, 3.4281983971595764e-06, 3.6507844924926758e-06, 3.873370587825775e-06, 4.0959566831588745e-06, 4.318542778491974e-06, 4.541128873825073e-06, 4.763714969158173e-06, 4.986301064491272e-06, 5.208887159824371e-06, 5.431473255157471e-06, 5.65405935049057e-06, 5.8766454458236694e-06, 6.099231541156769e-06, 6.321817636489868e-06, 6.5444037318229675e-06, 6.766989827156067e-06, 6.989575922489166e-06, 7.212162017822266e-06]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 2.0, 2.0, 8.0, 5.0, 9.0, 10.0, 18.0, 15.0, 45.0, 57.0, 88.0, 228.0, 541.0, 1417.0, 5807.0, 60901.0, 945925.0, 27403.0, 4069.0, 1146.0, 413.0, 193.0, 80.0, 55.0, 44.0, 20.0, 17.0, 7.0, 9.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08856201171875, -0.0857391357421875, -0.082916259765625, -0.0800933837890625, -0.0772705078125, -0.0744476318359375, -0.071624755859375, -0.0688018798828125, -0.06597900390625, -0.0631561279296875, -0.060333251953125, -0.0575103759765625, -0.0546875, -0.0518646240234375, -0.049041748046875, -0.0462188720703125, -0.04339599609375, -0.0405731201171875, -0.037750244140625, -0.0349273681640625, -0.0321044921875, -0.0292816162109375, -0.026458740234375, -0.0236358642578125, -0.02081298828125, -0.0179901123046875, -0.015167236328125, -0.0123443603515625, -0.009521484375, -0.0066986083984375, -0.003875732421875, -0.0010528564453125, 0.00177001953125, 0.0045928955078125, 0.007415771484375, 0.0102386474609375, 0.0130615234375, 0.0158843994140625, 0.018707275390625, 0.0215301513671875, 0.02435302734375, 0.0271759033203125, 0.029998779296875, 0.0328216552734375, 0.03564453125, 0.0384674072265625, 0.041290283203125, 0.0441131591796875, 0.04693603515625, 0.0497589111328125, 0.052581787109375, 0.0554046630859375, 0.0582275390625, 0.0610504150390625, 0.063873291015625, 0.0666961669921875, 0.06951904296875, 0.0723419189453125, 0.075164794921875, 0.0779876708984375, 0.080810546875, 0.0836334228515625, 0.086456298828125, 0.0892791748046875, 0.09210205078125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 4.0, 8.0, 7.0, 12.0, 15.0, 10.0, 25.0, 37.0, 50.0, 75.0, 87.0, 138.0, 119.0, 124.0, 82.0, 56.0, 38.0, 28.0, 14.0, 16.0, 7.0, 11.0, 5.0, 7.0, 6.0, 4.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0290069580078125, -0.028110027313232422, -0.027213096618652344, -0.026316165924072266, -0.025419235229492188, -0.02452230453491211, -0.02362537384033203, -0.022728443145751953, -0.021831512451171875, -0.020934581756591797, -0.02003765106201172, -0.01914072036743164, -0.018243789672851562, -0.017346858978271484, -0.016449928283691406, -0.015552997589111328, -0.01465606689453125, -0.013759136199951172, -0.012862205505371094, -0.011965274810791016, -0.011068344116210938, -0.01017141342163086, -0.009274482727050781, -0.008377552032470703, -0.007480621337890625, -0.006583690643310547, -0.005686759948730469, -0.004789829254150391, -0.0038928985595703125, -0.0029959678649902344, -0.0020990371704101562, -0.0012021064758300781, -0.00030517578125, 0.0005917549133300781, 0.0014886856079101562, 0.0023856163024902344, 0.0032825469970703125, 0.004179477691650391, 0.005076408386230469, 0.005973339080810547, 0.006870269775390625, 0.007767200469970703, 0.008664131164550781, 0.00956106185913086, 0.010457992553710938, 0.011354923248291016, 0.012251853942871094, 0.013148784637451172, 0.01404571533203125, 0.014942646026611328, 0.015839576721191406, 0.016736507415771484, 0.017633438110351562, 0.01853036880493164, 0.01942729949951172, 0.020324230194091797, 0.021221160888671875, 0.022118091583251953, 0.02301502227783203, 0.02391195297241211, 0.024808883666992188, 0.025705814361572266, 0.026602745056152344, 0.027499675750732422, 0.0283966064453125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 14.0, 160.0, 792.0, 34.0, 8.0, 2.0, 6.0], "bins": [-47.23650360107422, -46.43891906738281, -45.64133071899414, -44.843746185302734, -44.04615783691406, -43.248573303222656, -42.450984954833984, -41.65340042114258, -40.855812072753906, -40.0582275390625, -39.26063919067383, -38.46305465698242, -37.66546630859375, -36.867881774902344, -36.07029342651367, -35.272708892822266, -34.47512435913086, -33.67753982543945, -32.87995147705078, -32.082366943359375, -31.284778594970703, -30.487194061279297, -29.689607620239258, -28.89202117919922, -28.09443473815918, -27.29684829711914, -26.4992618560791, -25.701675415039062, -24.904090881347656, -24.106504440307617, -23.308917999267578, -22.51133155822754, -21.7137451171875, -20.91615867614746, -20.118572235107422, -19.320985794067383, -18.523399353027344, -17.725814819335938, -16.9282283782959, -16.13064193725586, -15.33305549621582, -14.535469055175781, -13.737882614135742, -12.94029712677002, -12.14271068572998, -11.345124244689941, -10.547538757324219, -9.74995231628418, -8.95236587524414, -8.154779434204102, -7.357193470001221, -6.55960750579834, -5.762021064758301, -4.964434623718262, -4.166848659515381, -3.3692626953125, -2.571676015853882, -1.7740898132324219, -0.9765036106109619, -0.17891740798950195, 0.618668794631958, 1.416254997253418, 2.213841199874878, 3.011427164077759, 3.809013605117798]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 6.0, 4.0, 12.0, 16.0, 25.0, 23.0, 37.0, 50.0, 61.0, 77.0, 74.0, 94.0, 86.0, 87.0, 84.0, 54.0, 51.0, 41.0, 34.0, 20.0, 22.0, 11.0, 10.0, 4.0, 4.0, 4.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.451914310455322, -5.28645133972168, -5.120988845825195, -4.955526351928711, -4.790063381195068, -4.624600410461426, -4.459137916564941, -4.293675422668457, -4.1282124519348145, -3.962749719619751, -3.7972869873046875, -3.631824254989624, -3.4663615226745605, -3.300898790359497, -3.1354360580444336, -2.96997332572937, -2.8045105934143066, -2.639047861099243, -2.4735851287841797, -2.308122396469116, -2.1426596641540527, -1.9771969318389893, -1.8117341995239258, -1.6462714672088623, -1.4808087348937988, -1.3153460025787354, -1.1498832702636719, -0.9844205379486084, -0.8189578056335449, -0.6534950733184814, -0.48803234100341797, -0.3225696086883545, -0.1571063995361328, 0.008356332778930664, 0.17381906509399414, 0.3392817974090576, 0.5047445297241211, 0.6702072620391846, 0.835669994354248, 1.0011327266693115, 1.166595458984375, 1.3320581912994385, 1.497520923614502, 1.6629836559295654, 1.828446388244629, 1.9939091205596924, 2.159371852874756, 2.3248345851898193, 2.490297317504883, 2.6557600498199463, 2.8212227821350098, 2.9866855144500732, 3.1521482467651367, 3.3176109790802, 3.4830737113952637, 3.648536443710327, 3.8139991760253906, 3.979461908340454, 4.144924640655518, 4.31038761138916, 4.4758501052856445, 4.641312599182129, 4.8067755699157715, 4.972238540649414, 5.137701034545898]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 16.0, 51.0, 57.0, 98.0, 248.0, 505.0, 3050.0, 4179897.0, 9364.0, 776.0, 172.0, 31.0, 9.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.28125, -35.4306640625, -34.580078125, -33.7294921875, -32.87890625, -32.0283203125, -31.177734375, -30.3271484375, -29.4765625, -28.6259765625, -27.775390625, -26.9248046875, -26.07421875, -25.2236328125, -24.373046875, -23.5224609375, -22.671875, -21.8212890625, -20.970703125, -20.1201171875, -19.26953125, -18.4189453125, -17.568359375, -16.7177734375, -15.8671875, -15.0166015625, -14.166015625, -13.3154296875, -12.46484375, -11.6142578125, -10.763671875, -9.9130859375, -9.0625, -8.2119140625, -7.361328125, -6.5107421875, -5.66015625, -4.8095703125, -3.958984375, -3.1083984375, -2.2578125, -1.4072265625, -0.556640625, 0.2939453125, 1.14453125, 1.9951171875, 2.845703125, 3.6962890625, 4.546875, 5.3974609375, 6.248046875, 7.0986328125, 7.94921875, 8.7998046875, 9.650390625, 10.5009765625, 11.3515625, 12.2021484375, 13.052734375, 13.9033203125, 14.75390625, 15.6044921875, 16.455078125, 17.3056640625, 18.15625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 2.0, 8.0, 7.0, 21.0, 52.0, 745.0, 108.0, 31.0, 13.0, 6.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72314453125, -0.7061920166015625, -0.689239501953125, -0.6722869873046875, -0.65533447265625, -0.6383819580078125, -0.621429443359375, -0.6044769287109375, -0.5875244140625, -0.5705718994140625, -0.553619384765625, -0.5366668701171875, -0.51971435546875, -0.5027618408203125, -0.485809326171875, -0.4688568115234375, -0.451904296875, -0.4349517822265625, -0.417999267578125, -0.4010467529296875, -0.38409423828125, -0.3671417236328125, -0.350189208984375, -0.3332366943359375, -0.3162841796875, -0.2993316650390625, -0.282379150390625, -0.2654266357421875, -0.24847412109375, -0.2315216064453125, -0.214569091796875, -0.1976165771484375, -0.1806640625, -0.1637115478515625, -0.146759033203125, -0.1298065185546875, -0.11285400390625, -0.0959014892578125, -0.078948974609375, -0.0619964599609375, -0.0450439453125, -0.0280914306640625, -0.011138916015625, 0.0058135986328125, 0.02276611328125, 0.0397186279296875, 0.056671142578125, 0.0736236572265625, 0.090576171875, 0.1075286865234375, 0.124481201171875, 0.1414337158203125, 0.15838623046875, 0.1753387451171875, 0.192291259765625, 0.2092437744140625, 0.2261962890625, 0.2431488037109375, 0.260101318359375, 0.2770538330078125, 0.29400634765625, 0.3109588623046875, 0.327911376953125, 0.3448638916015625, 0.36181640625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 8.0, 4.0, 9.0, 12.0, 14.0, 15.0, 15.0, 27.0, 36.0, 52.0, 75.0, 145.0, 413.0, 1898.0, 17462.0, 4020071.0, 145773.0, 6373.0, 1075.0, 299.0, 146.0, 71.0, 58.0, 47.0, 39.0, 31.0, 27.0, 13.0, 19.0, 12.0, 10.0, 7.0, 5.0, 4.0, 7.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.26171875, -4.11383056640625, -3.9659423828125, -3.81805419921875, -3.670166015625, -3.52227783203125, -3.3743896484375, -3.22650146484375, -3.07861328125, -2.93072509765625, -2.7828369140625, -2.63494873046875, -2.487060546875, -2.33917236328125, -2.1912841796875, -2.04339599609375, -1.8955078125, -1.74761962890625, -1.5997314453125, -1.45184326171875, -1.303955078125, -1.15606689453125, -1.0081787109375, -0.86029052734375, -0.71240234375, -0.56451416015625, -0.4166259765625, -0.26873779296875, -0.120849609375, 0.02703857421875, 0.1749267578125, 0.32281494140625, 0.470703125, 0.61859130859375, 0.7664794921875, 0.91436767578125, 1.062255859375, 1.21014404296875, 1.3580322265625, 1.50592041015625, 1.65380859375, 1.80169677734375, 1.9495849609375, 2.09747314453125, 2.245361328125, 2.39324951171875, 2.5411376953125, 2.68902587890625, 2.8369140625, 2.98480224609375, 3.1326904296875, 3.28057861328125, 3.428466796875, 3.57635498046875, 3.7242431640625, 3.87213134765625, 4.02001953125, 4.16790771484375, 4.3157958984375, 4.46368408203125, 4.611572265625, 4.75946044921875, 4.9073486328125, 5.05523681640625, 5.203125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 7.0, 3.0, 10.0, 9.0, 13.0, 19.0, 11.0, 23.0, 18.0, 31.0, 27.0, 29.0, 42.0, 50.0, 58.0, 91.0, 180.0, 2791.0, 247.0, 100.0, 69.0, 44.0, 42.0, 31.0, 30.0, 18.0, 11.0, 13.0, 12.0, 10.0, 8.0, 5.0, 2.0, 6.0, 4.0, 1.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.389892578125, -0.3789520263671875, -0.368011474609375, -0.3570709228515625, -0.34613037109375, -0.3351898193359375, -0.324249267578125, -0.3133087158203125, -0.3023681640625, -0.2914276123046875, -0.280487060546875, -0.2695465087890625, -0.25860595703125, -0.2476654052734375, -0.236724853515625, -0.2257843017578125, -0.21484375, -0.2039031982421875, -0.192962646484375, -0.1820220947265625, -0.17108154296875, -0.1601409912109375, -0.149200439453125, -0.1382598876953125, -0.1273193359375, -0.1163787841796875, -0.105438232421875, -0.0944976806640625, -0.08355712890625, -0.0726165771484375, -0.061676025390625, -0.0507354736328125, -0.039794921875, -0.0288543701171875, -0.017913818359375, -0.0069732666015625, 0.00396728515625, 0.0149078369140625, 0.025848388671875, 0.0367889404296875, 0.0477294921875, 0.0586700439453125, 0.069610595703125, 0.0805511474609375, 0.09149169921875, 0.1024322509765625, 0.113372802734375, 0.1243133544921875, 0.13525390625, 0.1461944580078125, 0.157135009765625, 0.1680755615234375, 0.17901611328125, 0.1899566650390625, 0.200897216796875, 0.2118377685546875, 0.2227783203125, 0.2337188720703125, 0.244659423828125, 0.2555999755859375, 0.26654052734375, 0.2774810791015625, 0.288421630859375, 0.2993621826171875, 0.310302734375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 10.0, 38.0, 685.0, 239.0, 26.0, 5.0, 3.0, 1.0, 1.0], "bins": [-11.203322410583496, -11.009543418884277, -10.815765380859375, -10.621986389160156, -10.428207397460938, -10.234429359436035, -10.040650367736816, -9.846872329711914, -9.653093338012695, -9.459314346313477, -9.265536308288574, -9.071757316589355, -8.877979278564453, -8.684200286865234, -8.490421295166016, -8.296643257141113, -8.102864265441895, -7.909085750579834, -7.715307235717773, -7.521528244018555, -7.327749729156494, -7.133971214294434, -6.940192222595215, -6.746413707733154, -6.552635192871094, -6.358856678009033, -6.165078163146973, -5.971299171447754, -5.777520656585693, -5.583742141723633, -5.389963150024414, -5.1961846351623535, -5.002406120300293, -4.808627605438232, -4.614849090576172, -4.421070098876953, -4.227291584014893, -4.033513069152832, -3.8397343158721924, -3.6459555625915527, -3.452176809310913, -3.2583980560302734, -3.064619541168213, -2.8708410263061523, -2.6770622730255127, -2.483283519744873, -2.2895050048828125, -2.095726490020752, -1.9019477367401123, -1.7081691026687622, -1.514390468597412, -1.320611834526062, -1.126833200454712, -0.9330545663833618, -0.7392759323120117, -0.5454972982406616, -0.3517186641693115, -0.15794003009796143, 0.03583860397338867, 0.22961723804473877, 0.42339587211608887, 0.617174506187439, 0.8109531402587891, 1.0047317743301392, 1.1985104084014893]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 13.0, 20.0, 17.0, 39.0, 59.0, 90.0, 105.0, 115.0, 108.0, 124.0, 103.0, 70.0, 57.0, 37.0, 18.0, 13.0, 7.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.40962553024292, -2.3139803409576416, -2.2183351516723633, -2.122690200805664, -2.0270450115203857, -1.9313998222351074, -1.835754632949829, -1.7401094436645508, -1.6444642543792725, -1.5488190650939941, -1.4531739950180054, -1.357528805732727, -1.2618836164474487, -1.16623854637146, -1.0705933570861816, -0.9749481678009033, -0.8793030977249146, -0.783657968044281, -0.6880127787590027, -0.5923676490783691, -0.4967224895954132, -0.4010773301124573, -0.30543220043182373, -0.2097870111465454, -0.11414188146591187, -0.01849672943353653, 0.0771484225988388, 0.17279356718063354, 0.2684387266635895, 0.3640838861465454, 0.45972901582717896, 0.5553742051124573, 0.6510193347930908, 0.7466644644737244, 0.8423096537590027, 0.9379547834396362, 1.0335999727249146, 1.1292450428009033, 1.2248902320861816, 1.32053542137146, 1.4161806106567383, 1.5118257999420166, 1.6074708700180054, 1.7031160593032837, 1.798761248588562, 1.8944063186645508, 1.990051507949829, 2.0856966972351074, 2.1813416481018066, 2.276986837387085, 2.3726320266723633, 2.4682769775390625, 2.563922166824341, 2.659567356109619, 2.7552125453948975, 2.850857734680176, 2.946502923965454, 3.0421481132507324, 3.1377933025360107, 3.233438491821289, 3.3290834426879883, 3.4247286319732666, 3.520373821258545, 3.6160190105438232, 3.7116641998291016]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 7.0, 6.0, 4.0, 7.0, 3.0, 7.0, 12.0, 18.0, 15.0, 14.0, 30.0, 52.0, 67.0, 76.0, 123.0, 206.0, 374.0, 613.0, 1310.0, 3806.0, 27881.0, 994686.0, 13800.0, 2895.0, 1092.0, 558.0, 316.0, 159.0, 144.0, 75.0, 50.0, 40.0, 25.0, 20.0, 17.0, 13.0, 10.0, 6.0, 5.0, 5.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-3.802734375, -3.692138671875, -3.58154296875, -3.470947265625, -3.3603515625, -3.249755859375, -3.13916015625, -3.028564453125, -2.91796875, -2.807373046875, -2.69677734375, -2.586181640625, -2.4755859375, -2.364990234375, -2.25439453125, -2.143798828125, -2.033203125, -1.922607421875, -1.81201171875, -1.701416015625, -1.5908203125, -1.480224609375, -1.36962890625, -1.259033203125, -1.1484375, -1.037841796875, -0.92724609375, -0.816650390625, -0.7060546875, -0.595458984375, -0.48486328125, -0.374267578125, -0.263671875, -0.153076171875, -0.04248046875, 0.068115234375, 0.1787109375, 0.289306640625, 0.39990234375, 0.510498046875, 0.62109375, 0.731689453125, 0.84228515625, 0.952880859375, 1.0634765625, 1.174072265625, 1.28466796875, 1.395263671875, 1.505859375, 1.616455078125, 1.72705078125, 1.837646484375, 1.9482421875, 2.058837890625, 2.16943359375, 2.280029296875, 2.390625, 2.501220703125, 2.61181640625, 2.722412109375, 2.8330078125, 2.943603515625, 3.05419921875, 3.164794921875, 3.275390625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 10.0, 13.0, 34.0, 332.0, 501.0, 73.0, 16.0, 7.0, 7.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67431640625, -0.6583137512207031, -0.6423110961914062, -0.6263084411621094, -0.6103057861328125, -0.5943031311035156, -0.5783004760742188, -0.5622978210449219, -0.546295166015625, -0.5302925109863281, -0.5142898559570312, -0.4982872009277344, -0.4822845458984375, -0.4662818908691406, -0.45027923583984375, -0.4342765808105469, -0.41827392578125, -0.4022712707519531, -0.38626861572265625, -0.3702659606933594, -0.3542633056640625, -0.3382606506347656, -0.32225799560546875, -0.3062553405761719, -0.290252685546875, -0.2742500305175781, -0.25824737548828125, -0.24224472045898438, -0.2262420654296875, -0.21023941040039062, -0.19423675537109375, -0.17823410034179688, -0.1622314453125, -0.14622879028320312, -0.13022613525390625, -0.11422348022460938, -0.0982208251953125, -0.08221817016601562, -0.06621551513671875, -0.050212860107421875, -0.034210205078125, -0.018207550048828125, -0.00220489501953125, 0.013797760009765625, 0.0298004150390625, 0.045803070068359375, 0.06180572509765625, 0.07780838012695312, 0.09381103515625, 0.10981369018554688, 0.12581634521484375, 0.14181900024414062, 0.1578216552734375, 0.17382431030273438, 0.18982696533203125, 0.20582962036132812, 0.221832275390625, 0.23783493041992188, 0.25383758544921875, 0.2698402404785156, 0.2858428955078125, 0.3018455505371094, 0.31784820556640625, 0.3338508605957031, 0.349853515625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 0.0, 4.0, 0.0, 6.0, 4.0, 10.0, 2.0, 7.0, 8.0, 13.0, 16.0, 17.0, 26.0, 28.0, 38.0, 47.0, 58.0, 97.0, 134.0, 228.0, 383.0, 741.0, 2018.0, 8788.0, 104758.0, 869254.0, 52860.0, 5835.0, 1493.0, 644.0, 356.0, 204.0, 138.0, 84.0, 54.0, 48.0, 32.0, 23.0, 22.0, 15.0, 10.0, 13.0, 6.0, 10.0, 6.0, 6.0, 3.0, 4.0, 1.0, 2.0, 4.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.64453125, -1.592132568359375, -1.53973388671875, -1.487335205078125, -1.4349365234375, -1.382537841796875, -1.33013916015625, -1.277740478515625, -1.225341796875, -1.172943115234375, -1.12054443359375, -1.068145751953125, -1.0157470703125, -0.963348388671875, -0.91094970703125, -0.858551025390625, -0.80615234375, -0.753753662109375, -0.70135498046875, -0.648956298828125, -0.5965576171875, -0.544158935546875, -0.49176025390625, -0.439361572265625, -0.386962890625, -0.334564208984375, -0.28216552734375, -0.229766845703125, -0.1773681640625, -0.124969482421875, -0.07257080078125, -0.020172119140625, 0.0322265625, 0.084625244140625, 0.13702392578125, 0.189422607421875, 0.2418212890625, 0.294219970703125, 0.34661865234375, 0.399017333984375, 0.451416015625, 0.503814697265625, 0.55621337890625, 0.608612060546875, 0.6610107421875, 0.713409423828125, 0.76580810546875, 0.818206787109375, 0.87060546875, 0.923004150390625, 0.97540283203125, 1.027801513671875, 1.0802001953125, 1.132598876953125, 1.18499755859375, 1.237396240234375, 1.289794921875, 1.342193603515625, 1.39459228515625, 1.446990966796875, 1.4993896484375, 1.551788330078125, 1.60418701171875, 1.656585693359375, 1.708984375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 3.0, 1.0, 2.0, 6.0, 5.0, 7.0, 8.0, 8.0, 9.0, 14.0, 10.0, 17.0, 20.0, 18.0, 27.0, 26.0, 29.0, 35.0, 32.0, 45.0, 41.0, 39.0, 41.0, 34.0, 39.0, 42.0, 48.0, 43.0, 38.0, 30.0, 34.0, 31.0, 29.0, 23.0, 25.0, 26.0, 19.0, 16.0, 14.0, 21.0, 9.0, 8.0, 5.0, 6.0, 6.0, 6.0, 4.0, 0.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.498046875, -0.4827423095703125, -0.467437744140625, -0.4521331787109375, -0.43682861328125, -0.4215240478515625, -0.406219482421875, -0.3909149169921875, -0.3756103515625, -0.3603057861328125, -0.345001220703125, -0.3296966552734375, -0.31439208984375, -0.2990875244140625, -0.283782958984375, -0.2684783935546875, -0.253173828125, -0.2378692626953125, -0.222564697265625, -0.2072601318359375, -0.19195556640625, -0.1766510009765625, -0.161346435546875, -0.1460418701171875, -0.1307373046875, -0.1154327392578125, -0.100128173828125, -0.0848236083984375, -0.06951904296875, -0.0542144775390625, -0.038909912109375, -0.0236053466796875, -0.00830078125, 0.0070037841796875, 0.022308349609375, 0.0376129150390625, 0.05291748046875, 0.0682220458984375, 0.083526611328125, 0.0988311767578125, 0.1141357421875, 0.1294403076171875, 0.144744873046875, 0.1600494384765625, 0.17535400390625, 0.1906585693359375, 0.205963134765625, 0.2212677001953125, 0.236572265625, 0.2518768310546875, 0.267181396484375, 0.2824859619140625, 0.29779052734375, 0.3130950927734375, 0.328399658203125, 0.3437042236328125, 0.3590087890625, 0.3743133544921875, 0.389617919921875, 0.4049224853515625, 0.42022705078125, 0.4355316162109375, 0.450836181640625, 0.4661407470703125, 0.4814453125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 3.0, 3.0, 7.0, 12.0, 12.0, 19.0, 33.0, 27.0, 41.0, 90.0, 118.0, 184.0, 403.0, 1054.0, 3671.0, 24909.0, 779110.0, 222613.0, 12389.0, 2286.0, 707.0, 352.0, 160.0, 109.0, 78.0, 41.0, 34.0, 18.0, 15.0, 11.0, 13.0, 7.0, 8.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28369140625, -0.2744941711425781, -0.26529693603515625, -0.2560997009277344, -0.2469024658203125, -0.23770523071289062, -0.22850799560546875, -0.21931076049804688, -0.210113525390625, -0.20091629028320312, -0.19171905517578125, -0.18252182006835938, -0.1733245849609375, -0.16412734985351562, -0.15493011474609375, -0.14573287963867188, -0.13653564453125, -0.12733840942382812, -0.11814117431640625, -0.10894393920898438, -0.0997467041015625, -0.09054946899414062, -0.08135223388671875, -0.07215499877929688, -0.062957763671875, -0.053760528564453125, -0.04456329345703125, -0.035366058349609375, -0.0261688232421875, -0.016971588134765625, -0.00777435302734375, 0.001422882080078125, 0.0106201171875, 0.019817352294921875, 0.02901458740234375, 0.038211822509765625, 0.0474090576171875, 0.056606292724609375, 0.06580352783203125, 0.07500076293945312, 0.084197998046875, 0.09339523315429688, 0.10259246826171875, 0.11178970336914062, 0.1209869384765625, 0.13018417358398438, 0.13938140869140625, 0.14857864379882812, 0.15777587890625, 0.16697311401367188, 0.17617034912109375, 0.18536758422851562, 0.1945648193359375, 0.20376205444335938, 0.21295928955078125, 0.22215652465820312, 0.231353759765625, 0.24055099487304688, 0.24974822998046875, 0.2589454650878906, 0.2681427001953125, 0.2773399353027344, 0.28653717041015625, 0.2957344055175781, 0.304931640625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 8.0, 6.0, 10.0, 15.0, 24.0, 25.0, 29.0, 54.0, 64.0, 103.0, 117.0, 115.0, 108.0, 98.0, 61.0, 32.0, 35.0, 16.0, 17.0, 13.0, 9.0, 5.0, 7.0, 5.0, 2.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4543533325195312e-05, -1.4077872037887573e-05, -1.3612210750579834e-05, -1.3146549463272095e-05, -1.2680888175964355e-05, -1.2215226888656616e-05, -1.1749565601348877e-05, -1.1283904314041138e-05, -1.0818243026733398e-05, -1.035258173942566e-05, -9.88692045211792e-06, -9.42125916481018e-06, -8.955597877502441e-06, -8.489936590194702e-06, -8.024275302886963e-06, -7.558614015579224e-06, -7.092952728271484e-06, -6.627291440963745e-06, -6.161630153656006e-06, -5.695968866348267e-06, -5.230307579040527e-06, -4.764646291732788e-06, -4.298985004425049e-06, -3.8333237171173096e-06, -3.3676624298095703e-06, -2.902001142501831e-06, -2.436339855194092e-06, -1.9706785678863525e-06, -1.5050172805786133e-06, -1.039355993270874e-06, -5.736947059631348e-07, -1.0803341865539551e-07, 3.5762786865234375e-07, 8.23289155960083e-07, 1.2889504432678223e-06, 1.7546117305755615e-06, 2.2202730178833008e-06, 2.68593430519104e-06, 3.1515955924987793e-06, 3.6172568798065186e-06, 4.082918167114258e-06, 4.548579454421997e-06, 5.014240741729736e-06, 5.479902029037476e-06, 5.945563316345215e-06, 6.411224603652954e-06, 6.876885890960693e-06, 7.342547178268433e-06, 7.808208465576172e-06, 8.273869752883911e-06, 8.73953104019165e-06, 9.20519232749939e-06, 9.670853614807129e-06, 1.0136514902114868e-05, 1.0602176189422607e-05, 1.1067837476730347e-05, 1.1533498764038086e-05, 1.1999160051345825e-05, 1.2464821338653564e-05, 1.2930482625961304e-05, 1.3396143913269043e-05, 1.3861805200576782e-05, 1.4327466487884521e-05, 1.479312777519226e-05, 1.52587890625e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 5.0, 6.0, 7.0, 8.0, 16.0, 19.0, 43.0, 64.0, 79.0, 163.0, 359.0, 991.0, 5172.0, 133943.0, 894274.0, 10755.0, 1640.0, 506.0, 194.0, 106.0, 47.0, 51.0, 33.0, 15.0, 12.0, 5.0, 8.0, 8.0, 6.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.521484375, -0.5057601928710938, -0.4900360107421875, -0.47431182861328125, -0.458587646484375, -0.44286346435546875, -0.4271392822265625, -0.41141510009765625, -0.39569091796875, -0.37996673583984375, -0.3642425537109375, -0.34851837158203125, -0.332794189453125, -0.31707000732421875, -0.3013458251953125, -0.28562164306640625, -0.2698974609375, -0.25417327880859375, -0.2384490966796875, -0.22272491455078125, -0.207000732421875, -0.19127655029296875, -0.1755523681640625, -0.15982818603515625, -0.14410400390625, -0.12837982177734375, -0.1126556396484375, -0.09693145751953125, -0.081207275390625, -0.06548309326171875, -0.0497589111328125, -0.03403472900390625, -0.018310546875, -0.00258636474609375, 0.0131378173828125, 0.02886199951171875, 0.044586181640625, 0.06031036376953125, 0.0760345458984375, 0.09175872802734375, 0.10748291015625, 0.12320709228515625, 0.1389312744140625, 0.15465545654296875, 0.170379638671875, 0.18610382080078125, 0.2018280029296875, 0.21755218505859375, 0.2332763671875, 0.24900054931640625, 0.2647247314453125, 0.28044891357421875, 0.296173095703125, 0.31189727783203125, 0.3276214599609375, 0.34334564208984375, 0.35906982421875, 0.37479400634765625, 0.3905181884765625, 0.40624237060546875, 0.421966552734375, 0.43769073486328125, 0.4534149169921875, 0.46913909912109375, 0.48486328125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 1.0, 7.0, 8.0, 3.0, 5.0, 9.0, 13.0, 17.0, 14.0, 22.0, 27.0, 40.0, 56.0, 89.0, 107.0, 107.0, 111.0, 87.0, 70.0, 58.0, 29.0, 18.0, 19.0, 23.0, 13.0, 9.0, 7.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1275634765625, -0.12325859069824219, -0.11895370483398438, -0.11464881896972656, -0.11034393310546875, -0.10603904724121094, -0.10173416137695312, -0.09742927551269531, -0.0931243896484375, -0.08881950378417969, -0.08451461791992188, -0.08020973205566406, -0.07590484619140625, -0.07159996032714844, -0.06729507446289062, -0.06299018859863281, -0.058685302734375, -0.05438041687011719, -0.050075531005859375, -0.04577064514160156, -0.04146575927734375, -0.03716087341308594, -0.032855987548828125, -0.028551101684570312, -0.0242462158203125, -0.019941329956054688, -0.015636444091796875, -0.011331558227539062, -0.00702667236328125, -0.0027217864990234375, 0.001583099365234375, 0.0058879852294921875, 0.01019287109375, 0.014497756958007812, 0.018802642822265625, 0.023107528686523438, 0.02741241455078125, 0.03171730041503906, 0.036022186279296875, 0.04032707214355469, 0.0446319580078125, 0.04893684387207031, 0.053241729736328125, 0.05754661560058594, 0.06185150146484375, 0.06615638732910156, 0.07046127319335938, 0.07476615905761719, 0.079071044921875, 0.08337593078613281, 0.08768081665039062, 0.09198570251464844, 0.09629058837890625, 0.10059547424316406, 0.10490036010742188, 0.10920524597167969, 0.1135101318359375, 0.11781501770019531, 0.12211990356445312, 0.12642478942871094, 0.13072967529296875, 0.13503456115722656, 0.13933944702148438, 0.1436443328857422, 0.14794921875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 11.0, 767.0, 237.0, 5.0], "bins": [-83.30458068847656, -81.95889282226562, -80.61321258544922, -79.26752471923828, -77.92184448242188, -76.57615661621094, -75.23047637939453, -73.8847885131836, -72.53910827636719, -71.19342041015625, -69.84774017333984, -68.5020523071289, -67.1563720703125, -65.81068420410156, -64.46500396728516, -63.11931610107422, -61.77362823486328, -60.42794418334961, -59.08226013183594, -57.736576080322266, -56.390892028808594, -55.045204162597656, -53.69952392578125, -52.35383605957031, -51.008155822753906, -49.662471771240234, -48.31678771972656, -46.97110366821289, -45.62541961669922, -44.27973175048828, -42.934051513671875, -41.58836364746094, -40.24268341064453, -38.89699935913086, -37.55131530761719, -36.205631256103516, -34.859947204589844, -33.514259338378906, -32.1685791015625, -30.822891235351562, -29.47720718383789, -28.13152313232422, -26.785839080810547, -25.440155029296875, -24.09446907043457, -22.7487850189209, -21.403100967407227, -20.057415008544922, -18.711732864379883, -17.36604881286621, -16.02036476135254, -14.67467975616455, -13.328994750976562, -11.98331069946289, -10.637626647949219, -9.29194164276123, -7.946257591247559, -6.6005730628967285, -5.254888534545898, -3.9092044830322266, -2.5635199546813965, -1.2178354263305664, 0.12784862518310547, 1.4735336303710938, 2.8192179203033447]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 13.0, 18.0, 21.0, 45.0, 53.0, 64.0, 68.0, 86.0, 77.0, 84.0, 75.0, 80.0, 77.0, 70.0, 55.0, 30.0, 26.0, 15.0, 8.0, 11.0, 7.0, 4.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.881531715393066, -8.656502723693848, -8.431473731994629, -8.20644474029541, -7.981415748596191, -7.756386756896973, -7.531358242034912, -7.306329250335693, -7.081300258636475, -6.856271266937256, -6.631242275238037, -6.406213283538818, -6.181184768676758, -5.956155776977539, -5.73112678527832, -5.506097793579102, -5.281068801879883, -5.056039810180664, -4.831010818481445, -4.605981826782227, -4.380952835083008, -4.155923843383789, -3.9308953285217285, -3.7058663368225098, -3.480837345123291, -3.2558083534240723, -3.0307793617248535, -2.805750608444214, -2.580721616744995, -2.3556926250457764, -2.1306638717651367, -1.905634880065918, -1.6806058883666992, -1.4555768966674805, -1.2305480241775513, -1.005519151687622, -0.7804901599884033, -0.5554611682891846, -0.33043229579925537, -0.10540342330932617, 0.11962556838989258, 0.34465450048446655, 0.5696834325790405, 0.7947123646736145, 1.0197412967681885, 1.2447702884674072, 1.4697991609573364, 1.6948280334472656, 1.9198570251464844, 2.144886016845703, 2.369915008544922, 2.5949437618255615, 2.8199727535247803, 3.045001745223999, 3.2700304985046387, 3.4950594902038574, 3.720088481903076, 3.945117473602295, 4.170146465301514, 4.395175457000732, 4.620203971862793, 4.845232963562012, 5.0702619552612305, 5.295290946960449, 5.520319938659668]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 13.0, 25.0, 35.0, 57.0, 153.0, 377.0, 3446.0, 4187331.0, 2425.0, 300.0, 72.0, 21.0, 11.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.375, -17.9520263671875, -17.529052734375, -17.1060791015625, -16.68310546875, -16.2601318359375, -15.837158203125, -15.4141845703125, -14.9912109375, -14.5682373046875, -14.145263671875, -13.7222900390625, -13.29931640625, -12.8763427734375, -12.453369140625, -12.0303955078125, -11.607421875, -11.1844482421875, -10.761474609375, -10.3385009765625, -9.91552734375, -9.4925537109375, -9.069580078125, -8.6466064453125, -8.2236328125, -7.8006591796875, -7.377685546875, -6.9547119140625, -6.53173828125, -6.1087646484375, -5.685791015625, -5.2628173828125, -4.83984375, -4.4168701171875, -3.993896484375, -3.5709228515625, -3.14794921875, -2.7249755859375, -2.302001953125, -1.8790283203125, -1.4560546875, -1.0330810546875, -0.610107421875, -0.1871337890625, 0.23583984375, 0.6588134765625, 1.081787109375, 1.5047607421875, 1.927734375, 2.3507080078125, 2.773681640625, 3.1966552734375, 3.61962890625, 4.0426025390625, 4.465576171875, 4.8885498046875, 5.3115234375, 5.7344970703125, 6.157470703125, 6.5804443359375, 7.00341796875, 7.4263916015625, 7.849365234375, 8.2723388671875, 8.6953125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 8.0, 15.0, 33.0, 227.0, 477.0, 176.0, 35.0, 13.0, 6.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72998046875, -0.713165283203125, -0.69635009765625, -0.679534912109375, -0.6627197265625, -0.645904541015625, -0.62908935546875, -0.612274169921875, -0.595458984375, -0.578643798828125, -0.56182861328125, -0.545013427734375, -0.5281982421875, -0.511383056640625, -0.49456787109375, -0.477752685546875, -0.4609375, -0.444122314453125, -0.42730712890625, -0.410491943359375, -0.3936767578125, -0.376861572265625, -0.36004638671875, -0.343231201171875, -0.326416015625, -0.309600830078125, -0.29278564453125, -0.275970458984375, -0.2591552734375, -0.242340087890625, -0.22552490234375, -0.208709716796875, -0.19189453125, -0.175079345703125, -0.15826416015625, -0.141448974609375, -0.1246337890625, -0.107818603515625, -0.09100341796875, -0.074188232421875, -0.057373046875, -0.040557861328125, -0.02374267578125, -0.006927490234375, 0.0098876953125, 0.026702880859375, 0.04351806640625, 0.060333251953125, 0.0771484375, 0.093963623046875, 0.11077880859375, 0.127593994140625, 0.1444091796875, 0.161224365234375, 0.17803955078125, 0.194854736328125, 0.211669921875, 0.228485107421875, 0.24530029296875, 0.262115478515625, 0.2789306640625, 0.295745849609375, 0.31256103515625, 0.329376220703125, 0.34619140625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 0.0, 4.0, 2.0, 2.0, 2.0, 5.0, 9.0, 10.0, 6.0, 20.0, 10.0, 28.0, 45.0, 58.0, 139.0, 381.0, 1294.0, 4851.0, 30343.0, 4093876.0, 53959.0, 6754.0, 1572.0, 502.0, 174.0, 76.0, 50.0, 26.0, 19.0, 21.0, 12.0, 7.0, 4.0, 4.0, 6.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.28515625, -2.2171630859375, -2.149169921875, -2.0811767578125, -2.01318359375, -1.9451904296875, -1.877197265625, -1.8092041015625, -1.7412109375, -1.6732177734375, -1.605224609375, -1.5372314453125, -1.46923828125, -1.4012451171875, -1.333251953125, -1.2652587890625, -1.197265625, -1.1292724609375, -1.061279296875, -0.9932861328125, -0.92529296875, -0.8572998046875, -0.789306640625, -0.7213134765625, -0.6533203125, -0.5853271484375, -0.517333984375, -0.4493408203125, -0.38134765625, -0.3133544921875, -0.245361328125, -0.1773681640625, -0.109375, -0.0413818359375, 0.026611328125, 0.0946044921875, 0.16259765625, 0.2305908203125, 0.298583984375, 0.3665771484375, 0.4345703125, 0.5025634765625, 0.570556640625, 0.6385498046875, 0.70654296875, 0.7745361328125, 0.842529296875, 0.9105224609375, 0.978515625, 1.0465087890625, 1.114501953125, 1.1824951171875, 1.25048828125, 1.3184814453125, 1.386474609375, 1.4544677734375, 1.5224609375, 1.5904541015625, 1.658447265625, 1.7264404296875, 1.79443359375, 1.8624267578125, 1.930419921875, 1.9984130859375, 2.06640625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 5.0, 2.0, 1.0, 4.0, 10.0, 6.0, 9.0, 7.0, 16.0, 12.0, 16.0, 30.0, 36.0, 58.0, 132.0, 2817.0, 594.0, 100.0, 62.0, 30.0, 25.0, 16.0, 12.0, 11.0, 11.0, 3.0, 8.0, 4.0, 6.0, 4.0, 5.0, 1.0, 1.0, 5.0, 1.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.299072265625, -0.2896919250488281, -0.28031158447265625, -0.2709312438964844, -0.2615509033203125, -0.2521705627441406, -0.24279022216796875, -0.23340988159179688, -0.224029541015625, -0.21464920043945312, -0.20526885986328125, -0.19588851928710938, -0.1865081787109375, -0.17712783813476562, -0.16774749755859375, -0.15836715698242188, -0.14898681640625, -0.13960647583007812, -0.13022613525390625, -0.12084579467773438, -0.1114654541015625, -0.10208511352539062, -0.09270477294921875, -0.08332443237304688, -0.073944091796875, -0.06456375122070312, -0.05518341064453125, -0.045803070068359375, -0.0364227294921875, -0.027042388916015625, -0.01766204833984375, -0.008281707763671875, 0.0010986328125, 0.010478973388671875, 0.01985931396484375, 0.029239654541015625, 0.0386199951171875, 0.048000335693359375, 0.05738067626953125, 0.06676101684570312, 0.076141357421875, 0.08552169799804688, 0.09490203857421875, 0.10428237915039062, 0.1136627197265625, 0.12304306030273438, 0.13242340087890625, 0.14180374145507812, 0.15118408203125, 0.16056442260742188, 0.16994476318359375, 0.17932510375976562, 0.1887054443359375, 0.19808578491210938, 0.20746612548828125, 0.21684646606445312, 0.226226806640625, 0.23560714721679688, 0.24498748779296875, 0.2543678283691406, 0.2637481689453125, 0.2731285095214844, 0.28250885009765625, 0.2918891906738281, 0.30126953125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [4.0, 51.0, 963.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9768232107162476, -0.5497756600379944, -0.12272810935974121, 0.30431950092315674, 0.7313669919967651, 1.1584144830703735, 1.585462212562561, 2.012509822845459, 2.4395570755004883, 2.8666045665740967, 3.293652057647705, 3.7206997871398926, 4.147747039794922, 4.574794769287109, 5.001842498779297, 5.428890228271484, 5.855937480926514, 6.282985210418701, 6.7100324630737305, 7.137080192565918, 7.5641279220581055, 7.991175174713135, 8.418222427368164, 8.845270156860352, 9.272317886352539, 9.699365615844727, 10.126413345336914, 10.553461074829102, 10.980507850646973, 11.40755558013916, 11.834603309631348, 12.261651039123535, 12.688697814941406, 13.115745544433594, 13.542793273925781, 13.969841003417969, 14.39688777923584, 14.823935508728027, 15.250983238220215, 15.678030967712402, 16.105077743530273, 16.53212547302246, 16.95917320251465, 17.386220932006836, 17.813268661499023, 18.240314483642578, 18.667362213134766, 19.094409942626953, 19.52145767211914, 19.948505401611328, 20.375553131103516, 20.802600860595703, 21.22964859008789, 21.656696319580078, 22.083744049072266, 22.51078987121582, 22.93783950805664, 23.364887237548828, 23.791934967041016, 24.218982696533203, 24.64603042602539, 25.073078155517578, 25.500125885009766, 25.92717170715332, 26.354219436645508]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 9.0, 11.0, 21.0, 54.0, 68.0, 107.0, 141.0, 123.0, 134.0, 118.0, 81.0, 47.0, 44.0, 32.0, 5.0, 2.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.183340072631836, -2.110987901687622, -2.038635730743408, -1.9662833213806152, -1.8939311504364014, -1.8215789794921875, -1.749226689338684, -1.6768743991851807, -1.6045222282409668, -1.532170057296753, -1.4598177671432495, -1.387465476989746, -1.3151133060455322, -1.2427611351013184, -1.170408844947815, -1.0980565547943115, -1.0257043838500977, -0.953352153301239, -0.8809999227523804, -0.8086476922035217, -0.7362954616546631, -0.6639432311058044, -0.5915910005569458, -0.5192387700080872, -0.4468865394592285, -0.3745343089103699, -0.30218207836151123, -0.2298298478126526, -0.15747761726379395, -0.0851253867149353, -0.01277315616607666, 0.05957907438278198, 0.13193154335021973, 0.20428377389907837, 0.276636004447937, 0.34898823499679565, 0.4213404655456543, 0.49369269609451294, 0.5660449266433716, 0.6383971571922302, 0.7107493877410889, 0.7831016182899475, 0.8554538488388062, 0.9278060793876648, 1.0001583099365234, 1.0725104808807373, 1.1448627710342407, 1.2172150611877441, 1.289567232131958, 1.3619194030761719, 1.4342716932296753, 1.5066239833831787, 1.5789761543273926, 1.6513283252716064, 1.7236806154251099, 1.7960329055786133, 1.8683850765228271, 1.940737247467041, 2.013089656829834, 2.085441827774048, 2.1577939987182617, 2.2301461696624756, 2.3024983406066895, 2.3748507499694824, 2.4472029209136963]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 3.0, 3.0, 2.0, 4.0, 8.0, 7.0, 9.0, 8.0, 16.0, 20.0, 30.0, 54.0, 45.0, 79.0, 117.0, 194.0, 353.0, 568.0, 1379.0, 3836.0, 29829.0, 989515.0, 16875.0, 3028.0, 1131.0, 565.0, 330.0, 172.0, 107.0, 86.0, 53.0, 31.0, 28.0, 20.0, 12.0, 8.0, 8.0, 4.0, 8.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.166015625, -3.071258544921875, -2.97650146484375, -2.881744384765625, -2.7869873046875, -2.692230224609375, -2.59747314453125, -2.502716064453125, -2.407958984375, -2.313201904296875, -2.21844482421875, -2.123687744140625, -2.0289306640625, -1.934173583984375, -1.83941650390625, -1.744659423828125, -1.64990234375, -1.555145263671875, -1.46038818359375, -1.365631103515625, -1.2708740234375, -1.176116943359375, -1.08135986328125, -0.986602783203125, -0.891845703125, -0.797088623046875, -0.70233154296875, -0.607574462890625, -0.5128173828125, -0.418060302734375, -0.32330322265625, -0.228546142578125, -0.1337890625, -0.039031982421875, 0.05572509765625, 0.150482177734375, 0.2452392578125, 0.339996337890625, 0.43475341796875, 0.529510498046875, 0.624267578125, 0.719024658203125, 0.81378173828125, 0.908538818359375, 1.0032958984375, 1.098052978515625, 1.19281005859375, 1.287567138671875, 1.38232421875, 1.477081298828125, 1.57183837890625, 1.666595458984375, 1.7613525390625, 1.856109619140625, 1.95086669921875, 2.045623779296875, 2.140380859375, 2.235137939453125, 2.32989501953125, 2.424652099609375, 2.5194091796875, 2.614166259765625, 2.70892333984375, 2.803680419921875, 2.8984375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 11.0, 16.0, 147.0, 447.0, 293.0, 47.0, 15.0, 9.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69189453125, -0.6756973266601562, -0.6595001220703125, -0.6433029174804688, -0.627105712890625, -0.6109085083007812, -0.5947113037109375, -0.5785140991210938, -0.56231689453125, -0.5461196899414062, -0.5299224853515625, -0.5137252807617188, -0.497528076171875, -0.48133087158203125, -0.4651336669921875, -0.44893646240234375, -0.4327392578125, -0.41654205322265625, -0.4003448486328125, -0.38414764404296875, -0.367950439453125, -0.35175323486328125, -0.3355560302734375, -0.31935882568359375, -0.30316162109375, -0.28696441650390625, -0.2707672119140625, -0.25457000732421875, -0.238372802734375, -0.22217559814453125, -0.2059783935546875, -0.18978118896484375, -0.173583984375, -0.15738677978515625, -0.1411895751953125, -0.12499237060546875, -0.108795166015625, -0.09259796142578125, -0.0764007568359375, -0.06020355224609375, -0.04400634765625, -0.02780914306640625, -0.0116119384765625, 0.00458526611328125, 0.020782470703125, 0.03697967529296875, 0.0531768798828125, 0.06937408447265625, 0.0855712890625, 0.10176849365234375, 0.1179656982421875, 0.13416290283203125, 0.150360107421875, 0.16655731201171875, 0.1827545166015625, 0.19895172119140625, 0.21514892578125, 0.23134613037109375, 0.2475433349609375, 0.26374053955078125, 0.279937744140625, 0.29613494873046875, 0.3123321533203125, 0.32852935791015625, 0.3447265625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 7.0, 7.0, 5.0, 7.0, 11.0, 18.0, 27.0, 29.0, 45.0, 39.0, 74.0, 127.0, 206.0, 463.0, 1145.0, 6883.0, 224796.0, 798741.0, 13041.0, 1616.0, 559.0, 268.0, 139.0, 77.0, 46.0, 50.0, 26.0, 22.0, 15.0, 19.0, 14.0, 9.0, 7.0, 5.0, 6.0, 4.0, 1.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.69140625, -2.618927001953125, -2.54644775390625, -2.473968505859375, -2.4014892578125, -2.329010009765625, -2.25653076171875, -2.184051513671875, -2.111572265625, -2.039093017578125, -1.96661376953125, -1.894134521484375, -1.8216552734375, -1.749176025390625, -1.67669677734375, -1.604217529296875, -1.53173828125, -1.459259033203125, -1.38677978515625, -1.314300537109375, -1.2418212890625, -1.169342041015625, -1.09686279296875, -1.024383544921875, -0.951904296875, -0.879425048828125, -0.80694580078125, -0.734466552734375, -0.6619873046875, -0.589508056640625, -0.51702880859375, -0.444549560546875, -0.3720703125, -0.299591064453125, -0.22711181640625, -0.154632568359375, -0.0821533203125, -0.009674072265625, 0.06280517578125, 0.135284423828125, 0.207763671875, 0.280242919921875, 0.35272216796875, 0.425201416015625, 0.4976806640625, 0.570159912109375, 0.64263916015625, 0.715118408203125, 0.78759765625, 0.860076904296875, 0.93255615234375, 1.005035400390625, 1.0775146484375, 1.149993896484375, 1.22247314453125, 1.294952392578125, 1.367431640625, 1.439910888671875, 1.51239013671875, 1.584869384765625, 1.6573486328125, 1.729827880859375, 1.80230712890625, 1.874786376953125, 1.947265625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 5.0, 2.0, 7.0, 5.0, 14.0, 9.0, 17.0, 17.0, 20.0, 24.0, 26.0, 33.0, 43.0, 49.0, 44.0, 49.0, 58.0, 46.0, 48.0, 52.0, 52.0, 66.0, 50.0, 46.0, 33.0, 30.0, 31.0, 31.0, 29.0, 17.0, 14.0, 10.0, 7.0, 5.0, 6.0, 5.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.634765625, -0.6110763549804688, -0.5873870849609375, -0.5636978149414062, -0.540008544921875, -0.5163192749023438, -0.4926300048828125, -0.46894073486328125, -0.44525146484375, -0.42156219482421875, -0.3978729248046875, -0.37418365478515625, -0.350494384765625, -0.32680511474609375, -0.3031158447265625, -0.27942657470703125, -0.2557373046875, -0.23204803466796875, -0.2083587646484375, -0.18466949462890625, -0.160980224609375, -0.13729095458984375, -0.1136016845703125, -0.08991241455078125, -0.06622314453125, -0.04253387451171875, -0.0188446044921875, 0.00484466552734375, 0.028533935546875, 0.05222320556640625, 0.0759124755859375, 0.09960174560546875, 0.123291015625, 0.14698028564453125, 0.1706695556640625, 0.19435882568359375, 0.218048095703125, 0.24173736572265625, 0.2654266357421875, 0.28911590576171875, 0.31280517578125, 0.33649444580078125, 0.3601837158203125, 0.38387298583984375, 0.407562255859375, 0.43125152587890625, 0.4549407958984375, 0.47863006591796875, 0.5023193359375, 0.5260086059570312, 0.5496978759765625, 0.5733871459960938, 0.597076416015625, 0.6207656860351562, 0.6444549560546875, 0.6681442260742188, 0.69183349609375, 0.7155227661132812, 0.7392120361328125, 0.7629013061523438, 0.786590576171875, 0.8102798461914062, 0.8339691162109375, 0.8576583862304688, 0.88134765625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 8.0, 8.0, 6.0, 4.0, 8.0, 14.0, 27.0, 31.0, 60.0, 101.0, 205.0, 560.0, 2577.0, 53870.0, 974102.0, 14871.0, 1363.0, 366.0, 159.0, 95.0, 39.0, 32.0, 16.0, 11.0, 6.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.67236328125, -0.6533355712890625, -0.634307861328125, -0.6152801513671875, -0.59625244140625, -0.5772247314453125, -0.558197021484375, -0.5391693115234375, -0.5201416015625, -0.5011138916015625, -0.482086181640625, -0.4630584716796875, -0.44403076171875, -0.4250030517578125, -0.405975341796875, -0.3869476318359375, -0.367919921875, -0.3488922119140625, -0.329864501953125, -0.3108367919921875, -0.29180908203125, -0.2727813720703125, -0.253753662109375, -0.2347259521484375, -0.2156982421875, -0.1966705322265625, -0.177642822265625, -0.1586151123046875, -0.13958740234375, -0.1205596923828125, -0.101531982421875, -0.0825042724609375, -0.0634765625, -0.0444488525390625, -0.025421142578125, -0.0063934326171875, 0.01263427734375, 0.0316619873046875, 0.050689697265625, 0.0697174072265625, 0.0887451171875, 0.1077728271484375, 0.126800537109375, 0.1458282470703125, 0.16485595703125, 0.1838836669921875, 0.202911376953125, 0.2219390869140625, 0.240966796875, 0.2599945068359375, 0.279022216796875, 0.2980499267578125, 0.31707763671875, 0.3361053466796875, 0.355133056640625, 0.3741607666015625, 0.3931884765625, 0.4122161865234375, 0.431243896484375, 0.4502716064453125, 0.46929931640625, 0.4883270263671875, 0.507354736328125, 0.5263824462890625, 0.54541015625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 6.0, 5.0, 10.0, 12.0, 19.0, 20.0, 33.0, 59.0, 129.0, 165.0, 141.0, 155.0, 94.0, 61.0, 35.0, 26.0, 12.0, 10.0, 5.0, 2.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.378225326538086e-05, -2.3089349269866943e-05, -2.2396445274353027e-05, -2.170354127883911e-05, -2.1010637283325195e-05, -2.031773328781128e-05, -1.9624829292297363e-05, -1.8931925296783447e-05, -1.823902130126953e-05, -1.7546117305755615e-05, -1.68532133102417e-05, -1.6160309314727783e-05, -1.5467405319213867e-05, -1.4774501323699951e-05, -1.4081597328186035e-05, -1.3388693332672119e-05, -1.2695789337158203e-05, -1.2002885341644287e-05, -1.1309981346130371e-05, -1.0617077350616455e-05, -9.924173355102539e-06, -9.231269359588623e-06, -8.538365364074707e-06, -7.845461368560791e-06, -7.152557373046875e-06, -6.459653377532959e-06, -5.766749382019043e-06, -5.073845386505127e-06, -4.380941390991211e-06, -3.688037395477295e-06, -2.995133399963379e-06, -2.302229404449463e-06, -1.6093254089355469e-06, -9.164214134216309e-07, -2.2351741790771484e-07, 4.6938657760620117e-07, 1.1622905731201172e-06, 1.8551945686340332e-06, 2.5480985641479492e-06, 3.2410025596618652e-06, 3.933906555175781e-06, 4.626810550689697e-06, 5.319714546203613e-06, 6.012618541717529e-06, 6.705522537231445e-06, 7.398426532745361e-06, 8.091330528259277e-06, 8.784234523773193e-06, 9.47713851928711e-06, 1.0170042514801025e-05, 1.0862946510314941e-05, 1.1555850505828857e-05, 1.2248754501342773e-05, 1.294165849685669e-05, 1.3634562492370605e-05, 1.4327466487884521e-05, 1.5020370483398438e-05, 1.5713274478912354e-05, 1.640617847442627e-05, 1.7099082469940186e-05, 1.77919864654541e-05, 1.8484890460968018e-05, 1.9177794456481934e-05, 1.987069845199585e-05, 2.0563602447509766e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 11.0, 10.0, 15.0, 12.0, 25.0, 42.0, 61.0, 117.0, 200.0, 441.0, 1872.0, 17194.0, 952340.0, 70721.0, 3963.0, 855.0, 295.0, 138.0, 86.0, 38.0, 31.0, 22.0, 14.0, 6.0, 6.0, 7.0, 4.0, 4.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0], "bins": [-0.6865234375, -0.6687812805175781, -0.6510391235351562, -0.6332969665527344, -0.6155548095703125, -0.5978126525878906, -0.5800704956054688, -0.5623283386230469, -0.544586181640625, -0.5268440246582031, -0.5091018676757812, -0.4913597106933594, -0.4736175537109375, -0.4558753967285156, -0.43813323974609375, -0.4203910827636719, -0.40264892578125, -0.3849067687988281, -0.36716461181640625, -0.3494224548339844, -0.3316802978515625, -0.3139381408691406, -0.29619598388671875, -0.2784538269042969, -0.260711669921875, -0.24296951293945312, -0.22522735595703125, -0.20748519897460938, -0.1897430419921875, -0.17200088500976562, -0.15425872802734375, -0.13651657104492188, -0.1187744140625, -0.10103225708007812, -0.08329010009765625, -0.06554794311523438, -0.0478057861328125, -0.030063629150390625, -0.01232147216796875, 0.005420684814453125, 0.023162841796875, 0.040904998779296875, 0.05864715576171875, 0.07638931274414062, 0.0941314697265625, 0.11187362670898438, 0.12961578369140625, 0.14735794067382812, 0.16510009765625, 0.18284225463867188, 0.20058441162109375, 0.21832656860351562, 0.2360687255859375, 0.2538108825683594, 0.27155303955078125, 0.2892951965332031, 0.307037353515625, 0.3247795104980469, 0.34252166748046875, 0.3602638244628906, 0.3780059814453125, 0.3957481384277344, 0.41349029541015625, 0.4312324523925781, 0.448974609375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 1.0, 2.0, 3.0, 3.0, 1.0, 9.0, 7.0, 10.0, 7.0, 18.0, 29.0, 35.0, 51.0, 70.0, 82.0, 103.0, 127.0, 120.0, 79.0, 75.0, 38.0, 34.0, 26.0, 18.0, 6.0, 13.0, 10.0, 8.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1480712890625, -0.14200782775878906, -0.13594436645507812, -0.1298809051513672, -0.12381744384765625, -0.11775398254394531, -0.11169052124023438, -0.10562705993652344, -0.0995635986328125, -0.09350013732910156, -0.08743667602539062, -0.08137321472167969, -0.07530975341796875, -0.06924629211425781, -0.06318283081054688, -0.05711936950683594, -0.051055908203125, -0.04499244689941406, -0.038928985595703125, -0.03286552429199219, -0.02680206298828125, -0.020738601684570312, -0.014675140380859375, -0.008611679077148438, -0.0025482177734375, 0.0035152435302734375, 0.009578704833984375, 0.015642166137695312, 0.02170562744140625, 0.027769088745117188, 0.033832550048828125, 0.03989601135253906, 0.04595947265625, 0.05202293395996094, 0.058086395263671875, 0.06414985656738281, 0.07021331787109375, 0.07627677917480469, 0.08234024047851562, 0.08840370178222656, 0.0944671630859375, 0.10053062438964844, 0.10659408569335938, 0.11265754699707031, 0.11872100830078125, 0.12478446960449219, 0.13084793090820312, 0.13691139221191406, 0.142974853515625, 0.14903831481933594, 0.15510177612304688, 0.1611652374267578, 0.16722869873046875, 0.1732921600341797, 0.17935562133789062, 0.18541908264160156, 0.1914825439453125, 0.19754600524902344, 0.20360946655273438, 0.2096729278564453, 0.21573638916015625, 0.2217998504638672, 0.22786331176757812, 0.23392677307128906, 0.239990234375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 20.0, 227.0, 716.0, 43.0, 5.0, 0.0, 1.0], "bins": [-41.116172790527344, -40.42205047607422, -39.72792434692383, -39.0338020324707, -38.33967590332031, -37.64555358886719, -36.95143127441406, -36.25730514526367, -35.56318283081055, -34.86906051635742, -34.17493438720703, -33.480812072753906, -32.786685943603516, -32.09256362915039, -31.398439407348633, -30.704315185546875, -30.010189056396484, -29.316064834594727, -28.62194061279297, -27.927818298339844, -27.233694076538086, -26.539569854736328, -25.84544563293457, -25.151321411132812, -24.457199096679688, -23.76307487487793, -23.068950653076172, -22.374828338623047, -21.68070411682129, -20.98657989501953, -20.292455673217773, -19.598331451416016, -18.904207229614258, -18.2100830078125, -17.515958786010742, -16.821834564208984, -16.12771224975586, -15.433588027954102, -14.739463806152344, -14.045339584350586, -13.351215362548828, -12.65709114074707, -11.962967872619629, -11.268843650817871, -10.574719429016113, -9.880596160888672, -9.186471939086914, -8.492347717285156, -7.798224449157715, -7.104100704193115, -6.409976482391357, -5.715852737426758, -5.021728515625, -4.3276047706604, -3.633481025695801, -2.939356803894043, -2.2452330589294434, -1.5511090755462646, -0.8569852113723755, -0.16286134719848633, 0.5312626361846924, 1.225386619567871, 1.9195103645324707, 2.6136345863342285, 3.307758331298828]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 6.0, 11.0, 15.0, 25.0, 27.0, 24.0, 33.0, 36.0, 45.0, 49.0, 54.0, 61.0, 74.0, 69.0, 76.0, 60.0, 56.0, 52.0, 48.0, 31.0, 32.0, 29.0, 24.0, 19.0, 14.0, 6.0, 11.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.673714637756348, -4.497820854187012, -4.321927070617676, -4.14603328704834, -3.970139503479004, -3.794245719909668, -3.618351936340332, -3.442458152770996, -3.26656436920166, -3.090670585632324, -2.9147768020629883, -2.7388830184936523, -2.5629892349243164, -2.3870954513549805, -2.2112016677856445, -2.0353078842163086, -1.8594141006469727, -1.6835203170776367, -1.5076265335083008, -1.3317327499389648, -1.155838966369629, -0.979945182800293, -0.804051399230957, -0.6281576156616211, -0.45226383209228516, -0.2763700485229492, -0.10047626495361328, 0.07541751861572266, 0.2513113021850586, 0.42720508575439453, 0.6030988693237305, 0.7789926528930664, 0.9548859596252441, 1.13077974319458, 1.306673526763916, 1.482567310333252, 1.658461093902588, 1.8343548774719238, 2.0102486610412598, 2.1861424446105957, 2.3620362281799316, 2.5379300117492676, 2.7138237953186035, 2.8897175788879395, 3.0656113624572754, 3.2415051460266113, 3.4173989295959473, 3.593292713165283, 3.769186496734619, 3.945080280303955, 4.120974063873291, 4.296867847442627, 4.472761631011963, 4.648655414581299, 4.824549198150635, 5.000442981719971, 5.176336765289307, 5.352230548858643, 5.5281243324279785, 5.7040181159973145, 5.87991189956665, 6.055805683135986, 6.231699466705322, 6.407593250274658, 6.583487033843994]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 10.0, 16.0, 12.0, 23.0, 37.0, 106.0, 201.0, 956.0, 393109.0, 3798517.0, 962.0, 196.0, 65.0, 37.0, 10.0, 11.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.19921875, -7.031829833984375, -6.86444091796875, -6.697052001953125, -6.5296630859375, -6.362274169921875, -6.19488525390625, -6.027496337890625, -5.860107421875, -5.692718505859375, -5.52532958984375, -5.357940673828125, -5.1905517578125, -5.023162841796875, -4.85577392578125, -4.688385009765625, -4.52099609375, -4.353607177734375, -4.18621826171875, -4.018829345703125, -3.8514404296875, -3.684051513671875, -3.51666259765625, -3.349273681640625, -3.181884765625, -3.014495849609375, -2.84710693359375, -2.679718017578125, -2.5123291015625, -2.344940185546875, -2.17755126953125, -2.010162353515625, -1.8427734375, -1.675384521484375, -1.50799560546875, -1.340606689453125, -1.1732177734375, -1.005828857421875, -0.83843994140625, -0.671051025390625, -0.503662109375, -0.336273193359375, -0.16888427734375, -0.001495361328125, 0.1658935546875, 0.333282470703125, 0.50067138671875, 0.668060302734375, 0.83544921875, 1.002838134765625, 1.17022705078125, 1.337615966796875, 1.5050048828125, 1.672393798828125, 1.83978271484375, 2.007171630859375, 2.174560546875, 2.341949462890625, 2.50933837890625, 2.676727294921875, 2.8441162109375, 3.011505126953125, 3.17889404296875, 3.346282958984375, 3.513671875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 10.0, 17.0, 102.0, 263.0, 375.0, 163.0, 45.0, 12.0, 7.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72216796875, -0.7054595947265625, -0.688751220703125, -0.6720428466796875, -0.65533447265625, -0.6386260986328125, -0.621917724609375, -0.6052093505859375, -0.5885009765625, -0.5717926025390625, -0.555084228515625, -0.5383758544921875, -0.52166748046875, -0.5049591064453125, -0.488250732421875, -0.4715423583984375, -0.454833984375, -0.4381256103515625, -0.421417236328125, -0.4047088623046875, -0.38800048828125, -0.3712921142578125, -0.354583740234375, -0.3378753662109375, -0.3211669921875, -0.3044586181640625, -0.287750244140625, -0.2710418701171875, -0.25433349609375, -0.2376251220703125, -0.220916748046875, -0.2042083740234375, -0.1875, -0.1707916259765625, -0.154083251953125, -0.1373748779296875, -0.12066650390625, -0.1039581298828125, -0.087249755859375, -0.0705413818359375, -0.0538330078125, -0.0371246337890625, -0.020416259765625, -0.0037078857421875, 0.01300048828125, 0.0297088623046875, 0.046417236328125, 0.0631256103515625, 0.079833984375, 0.0965423583984375, 0.113250732421875, 0.1299591064453125, 0.14666748046875, 0.1633758544921875, 0.180084228515625, 0.1967926025390625, 0.2135009765625, 0.2302093505859375, 0.246917724609375, 0.2636260986328125, 0.28033447265625, 0.2970428466796875, 0.313751220703125, 0.3304595947265625, 0.34716796875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 8.0, 12.0, 11.0, 24.0, 51.0, 91.0, 204.0, 675.0, 2005.0, 8554.0, 195867.0, 3971307.0, 12140.0, 2263.0, 631.0, 206.0, 110.0, 45.0, 18.0, 15.0, 11.0, 6.0, 7.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.44140625, -1.3935394287109375, -1.345672607421875, -1.2978057861328125, -1.24993896484375, -1.2020721435546875, -1.154205322265625, -1.1063385009765625, -1.0584716796875, -1.0106048583984375, -0.962738037109375, -0.9148712158203125, -0.86700439453125, -0.8191375732421875, -0.771270751953125, -0.7234039306640625, -0.675537109375, -0.6276702880859375, -0.579803466796875, -0.5319366455078125, -0.48406982421875, -0.4362030029296875, -0.388336181640625, -0.3404693603515625, -0.2926025390625, -0.2447357177734375, -0.196868896484375, -0.1490020751953125, -0.10113525390625, -0.0532684326171875, -0.005401611328125, 0.0424652099609375, 0.09033203125, 0.1381988525390625, 0.186065673828125, 0.2339324951171875, 0.28179931640625, 0.3296661376953125, 0.377532958984375, 0.4253997802734375, 0.4732666015625, 0.5211334228515625, 0.569000244140625, 0.6168670654296875, 0.66473388671875, 0.7126007080078125, 0.760467529296875, 0.8083343505859375, 0.856201171875, 0.9040679931640625, 0.951934814453125, 0.9998016357421875, 1.04766845703125, 1.0955352783203125, 1.143402099609375, 1.1912689208984375, 1.2391357421875, 1.2870025634765625, 1.334869384765625, 1.3827362060546875, 1.43060302734375, 1.4784698486328125, 1.526336669921875, 1.5742034912109375, 1.6220703125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 5.0, 8.0, 7.0, 6.0, 15.0, 18.0, 38.0, 50.0, 113.0, 1190.0, 2374.0, 114.0, 42.0, 23.0, 19.0, 10.0, 9.0, 2.0, 5.0, 5.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33935546875, -0.3296661376953125, -0.319976806640625, -0.3102874755859375, -0.30059814453125, -0.2909088134765625, -0.281219482421875, -0.2715301513671875, -0.2618408203125, -0.2521514892578125, -0.242462158203125, -0.2327728271484375, -0.22308349609375, -0.2133941650390625, -0.203704833984375, -0.1940155029296875, -0.184326171875, -0.1746368408203125, -0.164947509765625, -0.1552581787109375, -0.14556884765625, -0.1358795166015625, -0.126190185546875, -0.1165008544921875, -0.1068115234375, -0.0971221923828125, -0.087432861328125, -0.0777435302734375, -0.06805419921875, -0.0583648681640625, -0.048675537109375, -0.0389862060546875, -0.029296875, -0.0196075439453125, -0.009918212890625, -0.0002288818359375, 0.00946044921875, 0.0191497802734375, 0.028839111328125, 0.0385284423828125, 0.0482177734375, 0.0579071044921875, 0.067596435546875, 0.0772857666015625, 0.08697509765625, 0.0966644287109375, 0.106353759765625, 0.1160430908203125, 0.125732421875, 0.1354217529296875, 0.145111083984375, 0.1548004150390625, 0.16448974609375, 0.1741790771484375, 0.183868408203125, 0.1935577392578125, 0.2032470703125, 0.2129364013671875, 0.222625732421875, 0.2323150634765625, 0.24200439453125, 0.2516937255859375, 0.261383056640625, 0.2710723876953125, 0.28076171875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 7.0, 15.0, 60.0, 323.0, 477.0, 88.0, 27.0, 6.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5450942516326904, -1.488369107246399, -1.4316439628601074, -1.374918818473816, -1.3181936740875244, -1.2614684104919434, -1.2047433853149414, -1.1480181217193604, -1.0912929773330688, -1.0345678329467773, -0.9778426885604858, -0.9211175441741943, -0.8643923401832581, -0.8076671957969666, -0.750942051410675, -0.6942168474197388, -0.637491762638092, -0.5807666182518005, -0.524041473865509, -0.46731629967689514, -0.41059112548828125, -0.35386598110198975, -0.29714083671569824, -0.24041566252708435, -0.18369051814079285, -0.12696535885334015, -0.07024020701646805, -0.013515055179595947, 0.04321010410785675, 0.09993526339530945, 0.15666040778160095, 0.21338558197021484, 0.27011072635650635, 0.32683587074279785, 0.38356104493141174, 0.44028618931770325, 0.49701136350631714, 0.5537365078926086, 0.6104616522789001, 0.6671868562698364, 0.7239120006561279, 0.7806371450424194, 0.8373622894287109, 0.8940874338150024, 0.9508126378059387, 1.007537841796875, 1.064262866973877, 1.120988130569458, 1.17771315574646, 1.2344383001327515, 1.291163444519043, 1.3478885889053345, 1.404613733291626, 1.461338996887207, 1.518064022064209, 1.57478928565979, 1.6315144300460815, 1.688239574432373, 1.7449647188186646, 1.801689863204956, 1.8584150075912476, 1.915140151977539, 1.9718654155731201, 2.028590440750122, 2.085315704345703]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 14.0, 16.0, 12.0, 23.0, 20.0, 45.0, 56.0, 57.0, 75.0, 74.0, 83.0, 92.0, 78.0, 69.0, 56.0, 55.0, 42.0, 43.0, 32.0, 13.0, 17.0, 8.0, 10.0, 5.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8000990748405457, -0.7672092318534851, -0.7343193888664246, -0.701429545879364, -0.6685397028923035, -0.6356498599052429, -0.6027599573135376, -0.569870114326477, -0.5369802713394165, -0.504090428352356, -0.4712005853652954, -0.43831074237823486, -0.4054208993911743, -0.37253105640411377, -0.33964118361473083, -0.3067513406276703, -0.27386152744293213, -0.24097168445587158, -0.20808184146881104, -0.1751919835805893, -0.14230214059352875, -0.1094122976064682, -0.07652243971824646, -0.04363259673118591, -0.010742753744125366, 0.02214709296822548, 0.055036939680576324, 0.08792679011821747, 0.12081663310527802, 0.15370647609233856, 0.1865963339805603, 0.21948617696762085, 0.2523759603500366, 0.28526580333709717, 0.3181556463241577, 0.35104548931121826, 0.3839353322982788, 0.41682517528533936, 0.4497150480747223, 0.48260489106178284, 0.515494704246521, 0.5483845472335815, 0.5812743902206421, 0.6141642332077026, 0.6470540761947632, 0.6799439191818237, 0.7128337621688843, 0.7457236051559448, 0.7786135077476501, 0.8115033507347107, 0.8443931937217712, 0.8772830367088318, 0.9101728796958923, 0.9430627226829529, 0.9759526252746582, 1.0088424682617188, 1.0417323112487793, 1.0746221542358398, 1.1075119972229004, 1.140401840209961, 1.1732916831970215, 1.206181526184082, 1.2390713691711426, 1.2719612121582031, 1.3048510551452637]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 7.0, 3.0, 4.0, 9.0, 8.0, 18.0, 26.0, 26.0, 36.0, 59.0, 89.0, 124.0, 243.0, 419.0, 832.0, 1837.0, 6113.0, 201654.0, 822506.0, 10041.0, 2291.0, 966.0, 486.0, 268.0, 138.0, 84.0, 84.0, 44.0, 28.0, 34.0, 19.0, 8.0, 13.0, 10.0, 7.0, 5.0, 7.0, 6.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6943359375, -1.6361541748046875, -1.577972412109375, -1.5197906494140625, -1.46160888671875, -1.4034271240234375, -1.345245361328125, -1.2870635986328125, -1.2288818359375, -1.1707000732421875, -1.112518310546875, -1.0543365478515625, -0.99615478515625, -0.9379730224609375, -0.879791259765625, -0.8216094970703125, -0.763427734375, -0.7052459716796875, -0.647064208984375, -0.5888824462890625, -0.53070068359375, -0.4725189208984375, -0.414337158203125, -0.3561553955078125, -0.2979736328125, -0.2397918701171875, -0.181610107421875, -0.1234283447265625, -0.06524658203125, -0.0070648193359375, 0.051116943359375, 0.1092987060546875, 0.16748046875, 0.2256622314453125, 0.283843994140625, 0.3420257568359375, 0.40020751953125, 0.4583892822265625, 0.516571044921875, 0.5747528076171875, 0.6329345703125, 0.6911163330078125, 0.749298095703125, 0.8074798583984375, 0.86566162109375, 0.9238433837890625, 0.982025146484375, 1.0402069091796875, 1.098388671875, 1.1565704345703125, 1.214752197265625, 1.2729339599609375, 1.33111572265625, 1.3892974853515625, 1.447479248046875, 1.5056610107421875, 1.5638427734375, 1.6220245361328125, 1.680206298828125, 1.7383880615234375, 1.79656982421875, 1.8547515869140625, 1.912933349609375, 1.9711151123046875, 2.029296875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 11.0, 34.0, 162.0, 343.0, 302.0, 98.0, 25.0, 15.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70068359375, -0.684326171875, -0.66796875, -0.651611328125, -0.63525390625, -0.618896484375, -0.6025390625, -0.586181640625, -0.56982421875, -0.553466796875, -0.537109375, -0.520751953125, -0.50439453125, -0.488037109375, -0.4716796875, -0.455322265625, -0.43896484375, -0.422607421875, -0.40625, -0.389892578125, -0.37353515625, -0.357177734375, -0.3408203125, -0.324462890625, -0.30810546875, -0.291748046875, -0.275390625, -0.259033203125, -0.24267578125, -0.226318359375, -0.2099609375, -0.193603515625, -0.17724609375, -0.160888671875, -0.14453125, -0.128173828125, -0.11181640625, -0.095458984375, -0.0791015625, -0.062744140625, -0.04638671875, -0.030029296875, -0.013671875, 0.002685546875, 0.01904296875, 0.035400390625, 0.0517578125, 0.068115234375, 0.08447265625, 0.100830078125, 0.1171875, 0.133544921875, 0.14990234375, 0.166259765625, 0.1826171875, 0.198974609375, 0.21533203125, 0.231689453125, 0.248046875, 0.264404296875, 0.28076171875, 0.297119140625, 0.3134765625, 0.329833984375, 0.34619140625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 4.0, 4.0, 7.0, 7.0, 15.0, 15.0, 18.0, 18.0, 13.0, 45.0, 35.0, 42.0, 81.0, 126.0, 248.0, 499.0, 1552.0, 9899.0, 218602.0, 788827.0, 24418.0, 2538.0, 745.0, 321.0, 151.0, 97.0, 62.0, 36.0, 27.0, 15.0, 14.0, 17.0, 14.0, 9.0, 10.0, 9.0, 5.0, 8.0, 1.0, 3.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5751953125, -1.5290985107421875, -1.483001708984375, -1.4369049072265625, -1.39080810546875, -1.3447113037109375, -1.298614501953125, -1.2525177001953125, -1.2064208984375, -1.1603240966796875, -1.114227294921875, -1.0681304931640625, -1.02203369140625, -0.9759368896484375, -0.929840087890625, -0.8837432861328125, -0.837646484375, -0.7915496826171875, -0.745452880859375, -0.6993560791015625, -0.65325927734375, -0.6071624755859375, -0.561065673828125, -0.5149688720703125, -0.4688720703125, -0.4227752685546875, -0.376678466796875, -0.3305816650390625, -0.28448486328125, -0.2383880615234375, -0.192291259765625, -0.1461944580078125, -0.10009765625, -0.0540008544921875, -0.007904052734375, 0.0381927490234375, 0.08428955078125, 0.1303863525390625, 0.176483154296875, 0.2225799560546875, 0.2686767578125, 0.3147735595703125, 0.360870361328125, 0.4069671630859375, 0.45306396484375, 0.4991607666015625, 0.545257568359375, 0.5913543701171875, 0.637451171875, 0.6835479736328125, 0.729644775390625, 0.7757415771484375, 0.82183837890625, 0.8679351806640625, 0.914031982421875, 0.9601287841796875, 1.0062255859375, 1.0523223876953125, 1.098419189453125, 1.1445159912109375, 1.19061279296875, 1.2367095947265625, 1.282806396484375, 1.3289031982421875, 1.375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 7.0, 3.0, 11.0, 9.0, 6.0, 15.0, 16.0, 11.0, 15.0, 20.0, 27.0, 32.0, 39.0, 44.0, 34.0, 35.0, 53.0, 48.0, 49.0, 58.0, 61.0, 48.0, 45.0, 42.0, 43.0, 39.0, 26.0, 22.0, 31.0, 17.0, 20.0, 16.0, 17.0, 13.0, 12.0, 5.0, 8.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62255859375, -0.601898193359375, -0.58123779296875, -0.560577392578125, -0.5399169921875, -0.519256591796875, -0.49859619140625, -0.477935791015625, -0.457275390625, -0.436614990234375, -0.41595458984375, -0.395294189453125, -0.3746337890625, -0.353973388671875, -0.33331298828125, -0.312652587890625, -0.2919921875, -0.271331787109375, -0.25067138671875, -0.230010986328125, -0.2093505859375, -0.188690185546875, -0.16802978515625, -0.147369384765625, -0.126708984375, -0.106048583984375, -0.08538818359375, -0.064727783203125, -0.0440673828125, -0.023406982421875, -0.00274658203125, 0.017913818359375, 0.03857421875, 0.059234619140625, 0.07989501953125, 0.100555419921875, 0.1212158203125, 0.141876220703125, 0.16253662109375, 0.183197021484375, 0.203857421875, 0.224517822265625, 0.24517822265625, 0.265838623046875, 0.2864990234375, 0.307159423828125, 0.32781982421875, 0.348480224609375, 0.369140625, 0.389801025390625, 0.41046142578125, 0.431121826171875, 0.4517822265625, 0.472442626953125, 0.49310302734375, 0.513763427734375, 0.534423828125, 0.555084228515625, 0.57574462890625, 0.596405029296875, 0.6170654296875, 0.637725830078125, 0.65838623046875, 0.679046630859375, 0.69970703125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 9.0, 9.0, 11.0, 10.0, 27.0, 45.0, 78.0, 124.0, 240.0, 399.0, 1020.0, 2681.0, 9628.0, 70576.0, 821431.0, 123401.0, 13391.0, 3264.0, 1138.0, 472.0, 247.0, 123.0, 72.0, 50.0, 30.0, 25.0, 15.0, 15.0, 2.0, 6.0, 6.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.157958984375, -0.15262222290039062, -0.14728546142578125, -0.14194869995117188, -0.1366119384765625, -0.13127517700195312, -0.12593841552734375, -0.12060165405273438, -0.115264892578125, -0.10992813110351562, -0.10459136962890625, -0.09925460815429688, -0.0939178466796875, -0.08858108520507812, -0.08324432373046875, -0.07790756225585938, -0.07257080078125, -0.06723403930664062, -0.06189727783203125, -0.056560516357421875, -0.0512237548828125, -0.045886993408203125, -0.04055023193359375, -0.035213470458984375, -0.029876708984375, -0.024539947509765625, -0.01920318603515625, -0.013866424560546875, -0.0085296630859375, -0.003192901611328125, 0.00214385986328125, 0.007480621337890625, 0.0128173828125, 0.018154144287109375, 0.02349090576171875, 0.028827667236328125, 0.0341644287109375, 0.039501190185546875, 0.04483795166015625, 0.050174713134765625, 0.055511474609375, 0.060848236083984375, 0.06618499755859375, 0.07152175903320312, 0.0768585205078125, 0.08219528198242188, 0.08753204345703125, 0.09286880493164062, 0.09820556640625, 0.10354232788085938, 0.10887908935546875, 0.11421585083007812, 0.1195526123046875, 0.12488937377929688, 0.13022613525390625, 0.13556289672851562, 0.140899658203125, 0.14623641967773438, 0.15157318115234375, 0.15690994262695312, 0.1622467041015625, 0.16758346557617188, 0.17292022705078125, 0.17825698852539062, 0.18359375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 9.0, 11.0, 20.0, 17.0, 33.0, 47.0, 78.0, 108.0, 133.0, 158.0, 139.0, 82.0, 64.0, 47.0, 32.0, 13.0, 8.0, 6.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.806020736694336e-05, -1.7463229596614838e-05, -1.6866251826286316e-05, -1.6269274055957794e-05, -1.5672296285629272e-05, -1.507531851530075e-05, -1.4478340744972229e-05, -1.3881362974643707e-05, -1.3284385204315186e-05, -1.2687407433986664e-05, -1.2090429663658142e-05, -1.149345189332962e-05, -1.0896474123001099e-05, -1.0299496352672577e-05, -9.702518582344055e-06, -9.105540812015533e-06, -8.508563041687012e-06, -7.91158527135849e-06, -7.314607501029968e-06, -6.7176297307014465e-06, -6.120651960372925e-06, -5.523674190044403e-06, -4.926696419715881e-06, -4.32971864938736e-06, -3.732740879058838e-06, -3.135763108730316e-06, -2.5387853384017944e-06, -1.9418075680732727e-06, -1.344829797744751e-06, -7.478520274162292e-07, -1.5087425708770752e-07, 4.461035132408142e-07, 1.043081283569336e-06, 1.6400590538978577e-06, 2.2370368242263794e-06, 2.834014594554901e-06, 3.430992364883423e-06, 4.027970135211945e-06, 4.624947905540466e-06, 5.221925675868988e-06, 5.81890344619751e-06, 6.4158812165260315e-06, 7.012858986854553e-06, 7.609836757183075e-06, 8.206814527511597e-06, 8.803792297840118e-06, 9.40077006816864e-06, 9.997747838497162e-06, 1.0594725608825684e-05, 1.1191703379154205e-05, 1.1788681149482727e-05, 1.2385658919811249e-05, 1.298263669013977e-05, 1.3579614460468292e-05, 1.4176592230796814e-05, 1.4773570001125336e-05, 1.5370547771453857e-05, 1.596752554178238e-05, 1.65645033121109e-05, 1.7161481082439423e-05, 1.7758458852767944e-05, 1.8355436623096466e-05, 1.8952414393424988e-05, 1.954939216375351e-05, 2.014636993408203e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 12.0, 13.0, 15.0, 19.0, 28.0, 58.0, 90.0, 215.0, 562.0, 2878.0, 49304.0, 972425.0, 20064.0, 2009.0, 465.0, 176.0, 80.0, 48.0, 34.0, 16.0, 9.0, 7.0, 5.0, 4.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4345703125, -0.4215507507324219, -0.40853118896484375, -0.3955116271972656, -0.3824920654296875, -0.3694725036621094, -0.35645294189453125, -0.3434333801269531, -0.330413818359375, -0.3173942565917969, -0.30437469482421875, -0.2913551330566406, -0.2783355712890625, -0.2653160095214844, -0.25229644775390625, -0.23927688598632812, -0.22625732421875, -0.21323776245117188, -0.20021820068359375, -0.18719863891601562, -0.1741790771484375, -0.16115951538085938, -0.14813995361328125, -0.13512039184570312, -0.122100830078125, -0.10908126831054688, -0.09606170654296875, -0.08304214477539062, -0.0700225830078125, -0.057003021240234375, -0.04398345947265625, -0.030963897705078125, -0.0179443359375, -0.004924774169921875, 0.00809478759765625, 0.021114349365234375, 0.0341339111328125, 0.047153472900390625, 0.06017303466796875, 0.07319259643554688, 0.086212158203125, 0.09923171997070312, 0.11225128173828125, 0.12527084350585938, 0.1382904052734375, 0.15130996704101562, 0.16432952880859375, 0.17734909057617188, 0.19036865234375, 0.20338821411132812, 0.21640777587890625, 0.22942733764648438, 0.2424468994140625, 0.2554664611816406, 0.26848602294921875, 0.2815055847167969, 0.294525146484375, 0.3075447082519531, 0.32056427001953125, 0.3335838317871094, 0.3466033935546875, 0.3596229553222656, 0.37264251708984375, 0.3856620788574219, 0.398681640625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 1.0, 5.0, 3.0, 3.0, 7.0, 6.0, 8.0, 24.0, 29.0, 31.0, 60.0, 57.0, 87.0, 97.0, 110.0, 104.0, 90.0, 78.0, 53.0, 40.0, 24.0, 25.0, 12.0, 11.0, 8.0, 8.0, 10.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1566162109375, -0.1513347625732422, -0.14605331420898438, -0.14077186584472656, -0.13549041748046875, -0.13020896911621094, -0.12492752075195312, -0.11964607238769531, -0.1143646240234375, -0.10908317565917969, -0.10380172729492188, -0.09852027893066406, -0.09323883056640625, -0.08795738220214844, -0.08267593383789062, -0.07739448547363281, -0.072113037109375, -0.06683158874511719, -0.061550140380859375, -0.05626869201660156, -0.05098724365234375, -0.04570579528808594, -0.040424346923828125, -0.03514289855957031, -0.0298614501953125, -0.024580001831054688, -0.019298553466796875, -0.014017105102539062, -0.00873565673828125, -0.0034542083740234375, 0.001827239990234375, 0.0071086883544921875, 0.01239013671875, 0.017671585083007812, 0.022953033447265625, 0.028234481811523438, 0.03351593017578125, 0.03879737854003906, 0.044078826904296875, 0.04936027526855469, 0.0546417236328125, 0.05992317199707031, 0.06520462036132812, 0.07048606872558594, 0.07576751708984375, 0.08104896545410156, 0.08633041381835938, 0.09161186218261719, 0.096893310546875, 0.10217475891113281, 0.10745620727539062, 0.11273765563964844, 0.11801910400390625, 0.12330055236816406, 0.12858200073242188, 0.1338634490966797, 0.1391448974609375, 0.1444263458251953, 0.14970779418945312, 0.15498924255371094, 0.16027069091796875, 0.16555213928222656, 0.17083358764648438, 0.1761150360107422, 0.181396484375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 8.0, 6.0, 20.0, 30.0, 73.0, 171.0, 334.0, 195.0, 78.0, 36.0, 26.0, 12.0, 8.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.589051246643066, -5.455007553100586, -5.320964336395264, -5.186920642852783, -5.052877426147461, -4.9188337326049805, -4.784790515899658, -4.650746822357178, -4.5167036056518555, -4.382659912109375, -4.248616695404053, -4.114573001861572, -3.98052978515625, -3.8464863300323486, -3.7124428749084473, -3.578399181365967, -3.4443557262420654, -3.310312271118164, -3.1762688159942627, -3.0422253608703613, -2.90818190574646, -2.7741384506225586, -2.640094757080078, -2.506051540374756, -2.3720078468322754, -2.237964391708374, -2.1039209365844727, -1.9698774814605713, -1.83583402633667, -1.7017905712127686, -1.5677469968795776, -1.4337035417556763, -1.2996599674224854, -1.165616512298584, -1.0315730571746826, -0.8975295424461365, -0.7634860873222351, -0.6294426321983337, -0.4953991174697876, -0.36135566234588623, -0.22731220722198486, -0.0932687371969223, 0.04077473282814026, 0.174818217754364, 0.3088616728782654, 0.44290512800216675, 0.5769486427307129, 0.7109920978546143, 0.8450355529785156, 0.979079008102417, 1.1131224632263184, 1.2471659183502197, 1.381209373474121, 1.5152528285980225, 1.6492964029312134, 1.7833398580551147, 1.9173833131790161, 2.051426887512207, 2.1854703426361084, 2.3195137977600098, 2.453557252883911, 2.5876007080078125, 2.721644163131714, 2.8556876182556152, 2.9897310733795166]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 2.0, 6.0, 4.0, 10.0, 8.0, 9.0, 18.0, 16.0, 18.0, 24.0, 24.0, 31.0, 31.0, 33.0, 43.0, 45.0, 48.0, 51.0, 44.0, 54.0, 60.0, 47.0, 49.0, 37.0, 35.0, 35.0, 31.0, 28.0, 28.0, 20.0, 24.0, 21.0, 14.0, 14.0, 9.0, 9.0, 6.0, 5.0, 5.0, 3.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.11759090423584, -3.0048656463623047, -2.8921406269073486, -2.7794156074523926, -2.6666903495788574, -2.5539650917053223, -2.441240072250366, -2.32851505279541, -2.215789794921875, -2.10306453704834, -1.9903395175933838, -1.8776143789291382, -1.7648892402648926, -1.652164101600647, -1.5394389629364014, -1.4267138242721558, -1.3139886856079102, -1.2012635469436646, -1.088538408279419, -0.9758132696151733, -0.8630881309509277, -0.7503629922866821, -0.6376378536224365, -0.5249127149581909, -0.4121875762939453, -0.2994624376296997, -0.1867372989654541, -0.0740121603012085, 0.03871297836303711, 0.15143811702728271, 0.2641632556915283, 0.3768883943557739, 0.48961353302001953, 0.6023386716842651, 0.7150638103485107, 0.8277889490127563, 0.940514087677002, 1.0532392263412476, 1.1659643650054932, 1.2786895036697388, 1.3914146423339844, 1.50413978099823, 1.6168649196624756, 1.7295900583267212, 1.8423151969909668, 1.9550403356552124, 2.067765474319458, 2.180490493774414, 2.293215751647949, 2.4059410095214844, 2.5186660289764404, 2.6313910484313965, 2.7441163063049316, 2.856841564178467, 2.969566583633423, 3.082291603088379, 3.195016860961914, 3.307742118835449, 3.4204671382904053, 3.5331921577453613, 3.6459174156188965, 3.7586426734924316, 3.8713676929473877, 3.9840927124023438, 4.096817970275879]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 8.0, 11.0, 21.0, 53.0, 233.0, 2143.0, 4190961.0, 684.0, 105.0, 34.0, 9.0, 6.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.29296875, -7.1246337890625, -6.956298828125, -6.7879638671875, -6.61962890625, -6.4512939453125, -6.282958984375, -6.1146240234375, -5.9462890625, -5.7779541015625, -5.609619140625, -5.4412841796875, -5.27294921875, -5.1046142578125, -4.936279296875, -4.7679443359375, -4.599609375, -4.4312744140625, -4.262939453125, -4.0946044921875, -3.92626953125, -3.7579345703125, -3.589599609375, -3.4212646484375, -3.2529296875, -3.0845947265625, -2.916259765625, -2.7479248046875, -2.57958984375, -2.4112548828125, -2.242919921875, -2.0745849609375, -1.90625, -1.7379150390625, -1.569580078125, -1.4012451171875, -1.23291015625, -1.0645751953125, -0.896240234375, -0.7279052734375, -0.5595703125, -0.3912353515625, -0.222900390625, -0.0545654296875, 0.11376953125, 0.2821044921875, 0.450439453125, 0.6187744140625, 0.787109375, 0.9554443359375, 1.123779296875, 1.2921142578125, 1.46044921875, 1.6287841796875, 1.797119140625, 1.9654541015625, 2.1337890625, 2.3021240234375, 2.470458984375, 2.6387939453125, 2.80712890625, 2.9754638671875, 3.143798828125, 3.3121337890625, 3.48046875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 8.0, 17.0, 74.0, 179.0, 351.0, 248.0, 79.0, 26.0, 8.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7177734375, -0.7013053894042969, -0.6848373413085938, -0.6683692932128906, -0.6519012451171875, -0.6354331970214844, -0.6189651489257812, -0.6024971008300781, -0.586029052734375, -0.5695610046386719, -0.5530929565429688, -0.5366249084472656, -0.5201568603515625, -0.5036888122558594, -0.48722076416015625, -0.4707527160644531, -0.45428466796875, -0.4378166198730469, -0.42134857177734375, -0.4048805236816406, -0.3884124755859375, -0.3719444274902344, -0.35547637939453125, -0.3390083312988281, -0.322540283203125, -0.3060722351074219, -0.28960418701171875, -0.2731361389160156, -0.2566680908203125, -0.24020004272460938, -0.22373199462890625, -0.20726394653320312, -0.1907958984375, -0.17432785034179688, -0.15785980224609375, -0.14139175415039062, -0.1249237060546875, -0.10845565795898438, -0.09198760986328125, -0.07551956176757812, -0.059051513671875, -0.042583465576171875, -0.02611541748046875, -0.009647369384765625, 0.0068206787109375, 0.023288726806640625, 0.03975677490234375, 0.056224822998046875, 0.07269287109375, 0.08916091918945312, 0.10562896728515625, 0.12209701538085938, 0.1385650634765625, 0.15503311157226562, 0.17150115966796875, 0.18796920776367188, 0.204437255859375, 0.22090530395507812, 0.23737335205078125, 0.2538414001464844, 0.2703094482421875, 0.2867774963378906, 0.30324554443359375, 0.3197135925292969, 0.336181640625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 0.0, 8.0, 10.0, 27.0, 50.0, 81.0, 177.0, 428.0, 1198.0, 4495.0, 49177.0, 4115217.0, 19232.0, 2854.0, 772.0, 264.0, 131.0, 61.0, 34.0, 27.0, 13.0, 14.0, 8.0, 4.0, 3.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9931640625, -0.965850830078125, -0.93853759765625, -0.911224365234375, -0.8839111328125, -0.856597900390625, -0.82928466796875, -0.801971435546875, -0.774658203125, -0.747344970703125, -0.72003173828125, -0.692718505859375, -0.6654052734375, -0.638092041015625, -0.61077880859375, -0.583465576171875, -0.55615234375, -0.528839111328125, -0.50152587890625, -0.474212646484375, -0.4468994140625, -0.419586181640625, -0.39227294921875, -0.364959716796875, -0.337646484375, -0.310333251953125, -0.28302001953125, -0.255706787109375, -0.2283935546875, -0.201080322265625, -0.17376708984375, -0.146453857421875, -0.119140625, -0.091827392578125, -0.06451416015625, -0.037200927734375, -0.0098876953125, 0.017425537109375, 0.04473876953125, 0.072052001953125, 0.099365234375, 0.126678466796875, 0.15399169921875, 0.181304931640625, 0.2086181640625, 0.235931396484375, 0.26324462890625, 0.290557861328125, 0.31787109375, 0.345184326171875, 0.37249755859375, 0.399810791015625, 0.4271240234375, 0.454437255859375, 0.48175048828125, 0.509063720703125, 0.536376953125, 0.563690185546875, 0.59100341796875, 0.618316650390625, 0.6456298828125, 0.672943115234375, 0.70025634765625, 0.727569580078125, 0.7548828125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 11.0, 7.0, 10.0, 18.0, 45.0, 106.0, 1009.0, 2657.0, 115.0, 35.0, 23.0, 16.0, 3.0, 4.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1885986328125, -0.18136024475097656, -0.17412185668945312, -0.1668834686279297, -0.15964508056640625, -0.1524066925048828, -0.14516830444335938, -0.13792991638183594, -0.1306915283203125, -0.12345314025878906, -0.11621475219726562, -0.10897636413574219, -0.10173797607421875, -0.09449958801269531, -0.08726119995117188, -0.08002281188964844, -0.072784423828125, -0.06554603576660156, -0.058307647705078125, -0.05106925964355469, -0.04383087158203125, -0.03659248352050781, -0.029354095458984375, -0.022115707397460938, -0.0148773193359375, -0.0076389312744140625, -0.000400543212890625, 0.0068378448486328125, 0.01407623291015625, 0.021314620971679688, 0.028553009033203125, 0.03579139709472656, 0.04302978515625, 0.05026817321777344, 0.057506561279296875, 0.06474494934082031, 0.07198333740234375, 0.07922172546386719, 0.08646011352539062, 0.09369850158691406, 0.1009368896484375, 0.10817527770996094, 0.11541366577148438, 0.12265205383300781, 0.12989044189453125, 0.1371288299560547, 0.14436721801757812, 0.15160560607910156, 0.158843994140625, 0.16608238220214844, 0.17332077026367188, 0.1805591583251953, 0.18779754638671875, 0.1950359344482422, 0.20227432250976562, 0.20951271057128906, 0.2167510986328125, 0.22398948669433594, 0.23122787475585938, 0.2384662628173828, 0.24570465087890625, 0.2529430389404297, 0.2601814270019531, 0.26741981506347656, 0.274658203125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 165.0, 847.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3448017835617065, -1.1571334600448608, -0.9694650173187256, -0.7817966938018799, -0.5941283106803894, -0.4064599275588989, -0.21879160404205322, -0.03112316131591797, 0.15654516220092773, 0.3442135453224182, 0.5318819284439087, 0.7195502519607544, 0.9072186350822449, 1.0948870182037354, 1.282555341720581, 1.4702237844467163, 1.657892107963562, 1.8455604314804077, 2.033228874206543, 2.2208971977233887, 2.4085655212402344, 2.59623384475708, 2.783902168273926, 2.9715707302093506, 3.1592390537261963, 3.346907377243042, 3.5345757007598877, 3.7222442626953125, 3.909912586212158, 4.097580909729004, 4.28524923324585, 4.472917556762695, 4.660585880279541, 4.848254203796387, 5.035922527313232, 5.223590850830078, 5.411259174346924, 5.5989274978637695, 5.786596298217773, 5.974264621734619, 6.161932945251465, 6.3496012687683105, 6.537269592285156, 6.724937915802002, 6.912606239318848, 7.100275039672852, 7.287942886352539, 7.475611686706543, 7.6632795333862305, 7.850947856903076, 8.038616180419922, 8.226284980773926, 8.413952827453613, 8.601621627807617, 8.789289474487305, 8.976958274841309, 9.164627075195312, 9.352295875549316, 9.539963722229004, 9.727632522583008, 9.915300369262695, 10.1029691696167, 10.290637016296387, 10.47830581665039, 10.665973663330078]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 7.0, 5.0, 7.0, 10.0, 16.0, 18.0, 23.0, 30.0, 37.0, 35.0, 50.0, 61.0, 43.0, 51.0, 74.0, 68.0, 65.0, 71.0, 54.0, 43.0, 50.0, 38.0, 31.0, 19.0, 15.0, 20.0, 21.0, 13.0, 6.0, 7.0, 7.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47241783142089844, -0.4569101929664612, -0.4414025545120239, -0.42589494585990906, -0.4103873074054718, -0.39487966895103455, -0.3793720602989197, -0.3638644218444824, -0.34835678339004517, -0.3328491449356079, -0.31734150648117065, -0.3018338978290558, -0.28632625937461853, -0.2708186209201813, -0.2553110122680664, -0.23980337381362915, -0.2242957353591919, -0.20878809690475464, -0.19328047335147858, -0.17777284979820251, -0.16226521134376526, -0.146757572889328, -0.13124994933605194, -0.11574231833219528, -0.10023468732833862, -0.08472705632448196, -0.0692194253206253, -0.053711794316768646, -0.03820416331291199, -0.02269653230905533, -0.007188901305198669, 0.00831872969865799, 0.02382636070251465, 0.03933399170637131, 0.054841622710227966, 0.07034925371408463, 0.08585688471794128, 0.10136451572179794, 0.1168721467256546, 0.13237977027893066, 0.14788740873336792, 0.16339504718780518, 0.17890267074108124, 0.1944102942943573, 0.20991793274879456, 0.2254255712032318, 0.24093319475650787, 0.25644081830978394, 0.2719484567642212, 0.28745609521865845, 0.3029637336730957, 0.31847134232521057, 0.3339789807796478, 0.3494866192340851, 0.36499422788619995, 0.3805018663406372, 0.39600950479507446, 0.4115171432495117, 0.427024781703949, 0.44253239035606384, 0.4580400288105011, 0.47354766726493835, 0.4890552759170532, 0.5045629143714905, 0.5200705528259277]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 0.0, 4.0, 3.0, 8.0, 3.0, 3.0, 11.0, 9.0, 7.0, 10.0, 22.0, 27.0, 29.0, 32.0, 56.0, 88.0, 136.0, 183.0, 380.0, 615.0, 1332.0, 3474.0, 24567.0, 927429.0, 80722.0, 5634.0, 1781.0, 823.0, 406.0, 264.0, 165.0, 96.0, 56.0, 48.0, 34.0, 24.0, 14.0, 11.0, 13.0, 8.0, 6.0, 9.0, 5.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3466796875, -1.3041534423828125, -1.261627197265625, -1.2191009521484375, -1.17657470703125, -1.1340484619140625, -1.091522216796875, -1.0489959716796875, -1.0064697265625, -0.9639434814453125, -0.921417236328125, -0.8788909912109375, -0.83636474609375, -0.7938385009765625, -0.751312255859375, -0.7087860107421875, -0.666259765625, -0.6237335205078125, -0.581207275390625, -0.5386810302734375, -0.49615478515625, -0.4536285400390625, -0.411102294921875, -0.3685760498046875, -0.3260498046875, -0.2835235595703125, -0.240997314453125, -0.1984710693359375, -0.15594482421875, -0.1134185791015625, -0.070892333984375, -0.0283660888671875, 0.01416015625, 0.0566864013671875, 0.099212646484375, 0.1417388916015625, 0.18426513671875, 0.2267913818359375, 0.269317626953125, 0.3118438720703125, 0.3543701171875, 0.3968963623046875, 0.439422607421875, 0.4819488525390625, 0.52447509765625, 0.5670013427734375, 0.609527587890625, 0.6520538330078125, 0.694580078125, 0.7371063232421875, 0.779632568359375, 0.8221588134765625, 0.86468505859375, 0.9072113037109375, 0.949737548828125, 0.9922637939453125, 1.0347900390625, 1.0773162841796875, 1.119842529296875, 1.1623687744140625, 1.20489501953125, 1.2474212646484375, 1.289947509765625, 1.3324737548828125, 1.375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 8.0, 22.0, 79.0, 217.0, 346.0, 221.0, 69.0, 22.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70947265625, -0.693145751953125, -0.67681884765625, -0.660491943359375, -0.6441650390625, -0.627838134765625, -0.61151123046875, -0.595184326171875, -0.578857421875, -0.562530517578125, -0.54620361328125, -0.529876708984375, -0.5135498046875, -0.497222900390625, -0.48089599609375, -0.464569091796875, -0.4482421875, -0.431915283203125, -0.41558837890625, -0.399261474609375, -0.3829345703125, -0.366607666015625, -0.35028076171875, -0.333953857421875, -0.317626953125, -0.301300048828125, -0.28497314453125, -0.268646240234375, -0.2523193359375, -0.235992431640625, -0.21966552734375, -0.203338623046875, -0.18701171875, -0.170684814453125, -0.15435791015625, -0.138031005859375, -0.1217041015625, -0.105377197265625, -0.08905029296875, -0.072723388671875, -0.056396484375, -0.040069580078125, -0.02374267578125, -0.007415771484375, 0.0089111328125, 0.025238037109375, 0.04156494140625, 0.057891845703125, 0.07421875, 0.090545654296875, 0.10687255859375, 0.123199462890625, 0.1395263671875, 0.155853271484375, 0.17218017578125, 0.188507080078125, 0.204833984375, 0.221160888671875, 0.23748779296875, 0.253814697265625, 0.2701416015625, 0.286468505859375, 0.30279541015625, 0.319122314453125, 0.33544921875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 7.0, 5.0, 10.0, 9.0, 8.0, 8.0, 13.0, 20.0, 22.0, 20.0, 27.0, 46.0, 67.0, 117.0, 179.0, 347.0, 915.0, 3391.0, 19494.0, 259359.0, 716084.0, 40300.0, 5624.0, 1375.0, 443.0, 230.0, 132.0, 85.0, 53.0, 34.0, 24.0, 19.0, 12.0, 13.0, 11.0, 6.0, 8.0, 8.0, 5.0, 7.0, 4.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.00390625, -0.9706268310546875, -0.937347412109375, -0.9040679931640625, -0.87078857421875, -0.8375091552734375, -0.804229736328125, -0.7709503173828125, -0.7376708984375, -0.7043914794921875, -0.671112060546875, -0.6378326416015625, -0.60455322265625, -0.5712738037109375, -0.537994384765625, -0.5047149658203125, -0.471435546875, -0.4381561279296875, -0.404876708984375, -0.3715972900390625, -0.33831787109375, -0.3050384521484375, -0.271759033203125, -0.2384796142578125, -0.2052001953125, -0.1719207763671875, -0.138641357421875, -0.1053619384765625, -0.07208251953125, -0.0388031005859375, -0.005523681640625, 0.0277557373046875, 0.06103515625, 0.0943145751953125, 0.127593994140625, 0.1608734130859375, 0.19415283203125, 0.2274322509765625, 0.260711669921875, 0.2939910888671875, 0.3272705078125, 0.3605499267578125, 0.393829345703125, 0.4271087646484375, 0.46038818359375, 0.4936676025390625, 0.526947021484375, 0.5602264404296875, 0.593505859375, 0.6267852783203125, 0.660064697265625, 0.6933441162109375, 0.72662353515625, 0.7599029541015625, 0.793182373046875, 0.8264617919921875, 0.8597412109375, 0.8930206298828125, 0.926300048828125, 0.9595794677734375, 0.99285888671875, 1.0261383056640625, 1.059417724609375, 1.0926971435546875, 1.1259765625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 2.0, 6.0, 6.0, 6.0, 7.0, 9.0, 7.0, 10.0, 14.0, 12.0, 16.0, 19.0, 24.0, 33.0, 27.0, 37.0, 48.0, 51.0, 45.0, 49.0, 36.0, 42.0, 41.0, 49.0, 53.0, 47.0, 40.0, 44.0, 35.0, 23.0, 29.0, 19.0, 17.0, 17.0, 22.0, 6.0, 8.0, 9.0, 13.0, 5.0, 2.0, 11.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.63134765625, -0.6125640869140625, -0.593780517578125, -0.5749969482421875, -0.55621337890625, -0.5374298095703125, -0.518646240234375, -0.4998626708984375, -0.4810791015625, -0.4622955322265625, -0.443511962890625, -0.4247283935546875, -0.40594482421875, -0.3871612548828125, -0.368377685546875, -0.3495941162109375, -0.330810546875, -0.3120269775390625, -0.293243408203125, -0.2744598388671875, -0.25567626953125, -0.2368927001953125, -0.218109130859375, -0.1993255615234375, -0.1805419921875, -0.1617584228515625, -0.142974853515625, -0.1241912841796875, -0.10540771484375, -0.0866241455078125, -0.067840576171875, -0.0490570068359375, -0.0302734375, -0.0114898681640625, 0.007293701171875, 0.0260772705078125, 0.04486083984375, 0.0636444091796875, 0.082427978515625, 0.1012115478515625, 0.1199951171875, 0.1387786865234375, 0.157562255859375, 0.1763458251953125, 0.19512939453125, 0.2139129638671875, 0.232696533203125, 0.2514801025390625, 0.270263671875, 0.2890472412109375, 0.307830810546875, 0.3266143798828125, 0.34539794921875, 0.3641815185546875, 0.382965087890625, 0.4017486572265625, 0.4205322265625, 0.4393157958984375, 0.458099365234375, 0.4768829345703125, 0.49566650390625, 0.5144500732421875, 0.533233642578125, 0.5520172119140625, 0.57080078125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 2.0, 3.0, 3.0, 7.0, 12.0, 20.0, 41.0, 63.0, 111.0, 208.0, 443.0, 1179.0, 4575.0, 32712.0, 738718.0, 251722.0, 14512.0, 2664.0, 848.0, 335.0, 162.0, 74.0, 39.0, 31.0, 22.0, 16.0, 12.0, 12.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1451416015625, -0.1399250030517578, -0.13470840454101562, -0.12949180603027344, -0.12427520751953125, -0.11905860900878906, -0.11384201049804688, -0.10862541198730469, -0.1034088134765625, -0.09819221496582031, -0.09297561645507812, -0.08775901794433594, -0.08254241943359375, -0.07732582092285156, -0.07210922241210938, -0.06689262390136719, -0.061676025390625, -0.05645942687988281, -0.051242828369140625, -0.04602622985839844, -0.04080963134765625, -0.03559303283691406, -0.030376434326171875, -0.025159835815429688, -0.0199432373046875, -0.014726638793945312, -0.009510040283203125, -0.0042934417724609375, 0.00092315673828125, 0.0061397552490234375, 0.011356353759765625, 0.016572952270507812, 0.02178955078125, 0.027006149291992188, 0.032222747802734375, 0.03743934631347656, 0.04265594482421875, 0.04787254333496094, 0.053089141845703125, 0.05830574035644531, 0.0635223388671875, 0.06873893737792969, 0.07395553588867188, 0.07917213439941406, 0.08438873291015625, 0.08960533142089844, 0.09482192993164062, 0.10003852844238281, 0.105255126953125, 0.11047172546386719, 0.11568832397460938, 0.12090492248535156, 0.12612152099609375, 0.13133811950683594, 0.13655471801757812, 0.1417713165283203, 0.1469879150390625, 0.1522045135498047, 0.15742111206054688, 0.16263771057128906, 0.16785430908203125, 0.17307090759277344, 0.17828750610351562, 0.1835041046142578, 0.188720703125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 4.0, 7.0, 8.0, 10.0, 11.0, 13.0, 12.0, 24.0, 28.0, 31.0, 40.0, 47.0, 38.0, 76.0, 92.0, 79.0, 59.0, 76.0, 69.0, 64.0, 44.0, 42.0, 22.0, 13.0, 21.0, 19.0, 16.0, 8.0, 6.0, 6.0, 1.0, 7.0, 4.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.417533874511719e-06, -9.120441973209381e-06, -8.823350071907043e-06, -8.526258170604706e-06, -8.229166269302368e-06, -7.93207436800003e-06, -7.634982466697693e-06, -7.337890565395355e-06, -7.040798664093018e-06, -6.74370676279068e-06, -6.446614861488342e-06, -6.149522960186005e-06, -5.852431058883667e-06, -5.555339157581329e-06, -5.258247256278992e-06, -4.961155354976654e-06, -4.664063453674316e-06, -4.366971552371979e-06, -4.069879651069641e-06, -3.7727877497673035e-06, -3.475695848464966e-06, -3.178603947162628e-06, -2.8815120458602905e-06, -2.584420144557953e-06, -2.2873282432556152e-06, -1.9902363419532776e-06, -1.69314444065094e-06, -1.3960525393486023e-06, -1.0989606380462646e-06, -8.01868736743927e-07, -5.047768354415894e-07, -2.076849341392517e-07, 8.940696716308594e-08, 3.864988684654236e-07, 6.835907697677612e-07, 9.806826710700989e-07, 1.2777745723724365e-06, 1.5748664736747742e-06, 1.8719583749771118e-06, 2.1690502762794495e-06, 2.466142177581787e-06, 2.7632340788841248e-06, 3.0603259801864624e-06, 3.3574178814888e-06, 3.6545097827911377e-06, 3.951601684093475e-06, 4.248693585395813e-06, 4.545785486698151e-06, 4.842877388000488e-06, 5.139969289302826e-06, 5.4370611906051636e-06, 5.734153091907501e-06, 6.031244993209839e-06, 6.3283368945121765e-06, 6.625428795814514e-06, 6.922520697116852e-06, 7.2196125984191895e-06, 7.516704499721527e-06, 7.813796401023865e-06, 8.110888302326202e-06, 8.40798020362854e-06, 8.705072104930878e-06, 9.002164006233215e-06, 9.299255907535553e-06, 9.59634780883789e-06]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 4.0, 7.0, 10.0, 9.0, 13.0, 19.0, 24.0, 45.0, 52.0, 105.0, 212.0, 568.0, 1994.0, 12251.0, 391001.0, 623049.0, 15754.0, 2279.0, 629.0, 231.0, 98.0, 62.0, 42.0, 22.0, 24.0, 14.0, 17.0, 9.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2203369140625, -0.21300506591796875, -0.2056732177734375, -0.19834136962890625, -0.191009521484375, -0.18367767333984375, -0.1763458251953125, -0.16901397705078125, -0.16168212890625, -0.15435028076171875, -0.1470184326171875, -0.13968658447265625, -0.132354736328125, -0.12502288818359375, -0.1176910400390625, -0.11035919189453125, -0.10302734375, -0.09569549560546875, -0.0883636474609375, -0.08103179931640625, -0.073699951171875, -0.06636810302734375, -0.0590362548828125, -0.05170440673828125, -0.04437255859375, -0.03704071044921875, -0.0297088623046875, -0.02237701416015625, -0.015045166015625, -0.00771331787109375, -0.0003814697265625, 0.00695037841796875, 0.0142822265625, 0.02161407470703125, 0.0289459228515625, 0.03627777099609375, 0.043609619140625, 0.05094146728515625, 0.0582733154296875, 0.06560516357421875, 0.07293701171875, 0.08026885986328125, 0.0876007080078125, 0.09493255615234375, 0.102264404296875, 0.10959625244140625, 0.1169281005859375, 0.12425994873046875, 0.131591796875, 0.13892364501953125, 0.1462554931640625, 0.15358734130859375, 0.160919189453125, 0.16825103759765625, 0.1755828857421875, 0.18291473388671875, 0.19024658203125, 0.19757843017578125, 0.2049102783203125, 0.21224212646484375, 0.219573974609375, 0.22690582275390625, 0.2342376708984375, 0.24156951904296875, 0.2489013671875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 5.0, 1.0, 5.0, 5.0, 14.0, 16.0, 12.0, 24.0, 24.0, 31.0, 41.0, 56.0, 65.0, 85.0, 89.0, 109.0, 94.0, 67.0, 59.0, 41.0, 38.0, 29.0, 18.0, 19.0, 16.0, 9.0, 7.0, 4.0, 8.0, 5.0, 3.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.134033203125, -0.1301097869873047, -0.12618637084960938, -0.12226295471191406, -0.11833953857421875, -0.11441612243652344, -0.11049270629882812, -0.10656929016113281, -0.1026458740234375, -0.09872245788574219, -0.09479904174804688, -0.09087562561035156, -0.08695220947265625, -0.08302879333496094, -0.07910537719726562, -0.07518196105957031, -0.071258544921875, -0.06733512878417969, -0.06341171264648438, -0.05948829650878906, -0.05556488037109375, -0.05164146423339844, -0.047718048095703125, -0.04379463195800781, -0.0398712158203125, -0.03594779968261719, -0.032024383544921875, -0.028100967407226562, -0.02417755126953125, -0.020254135131835938, -0.016330718994140625, -0.012407302856445312, -0.00848388671875, -0.0045604705810546875, -0.000637054443359375, 0.0032863616943359375, 0.00720977783203125, 0.011133193969726562, 0.015056610107421875, 0.018980026245117188, 0.0229034423828125, 0.026826858520507812, 0.030750274658203125, 0.03467369079589844, 0.03859710693359375, 0.04252052307128906, 0.046443939208984375, 0.05036735534667969, 0.054290771484375, 0.05821418762207031, 0.062137603759765625, 0.06606101989746094, 0.06998443603515625, 0.07390785217285156, 0.07783126831054688, 0.08175468444824219, 0.0856781005859375, 0.08960151672363281, 0.09352493286132812, 0.09744834899902344, 0.10137176513671875, 0.10529518127441406, 0.10921859741210938, 0.11314201354980469, 0.1170654296875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 6.0, 3.0, 14.0, 13.0, 24.0, 38.0, 79.0, 178.0, 280.0, 182.0, 75.0, 38.0, 34.0, 19.0, 8.0, 7.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.151472091674805, -5.03578519821167, -4.920098304748535, -4.8044114112854, -4.688724517822266, -4.573037624359131, -4.457350730895996, -4.341663837432861, -4.225976943969727, -4.110290050506592, -3.994603157043457, -3.8789162635803223, -3.7632293701171875, -3.6475424766540527, -3.531855583190918, -3.416168689727783, -3.3004820346832275, -3.1847951412200928, -3.069108247756958, -2.9534213542938232, -2.8377344608306885, -2.7220475673675537, -2.606360912322998, -2.4906740188598633, -2.3749871253967285, -2.2593002319335938, -2.143613338470459, -2.027926445007324, -1.9122395515441895, -1.7965526580810547, -1.6808658838272095, -1.5651789903640747, -1.4494922161102295, -1.3338053226470947, -1.21811842918396, -1.1024315357208252, -0.9867447018623352, -0.8710578083992004, -0.7553709745407104, -0.6396840810775757, -0.5239971876144409, -0.40831029415130615, -0.2926234304904938, -0.1769365668296814, -0.06124967336654663, 0.054437220096588135, 0.17012405395507812, 0.2858109474182129, 0.40149784088134766, 0.5171847343444824, 0.6328716278076172, 0.7485584616661072, 0.8642453551292419, 0.9799322485923767, 1.0956190824508667, 1.2113059759140015, 1.3269928693771362, 1.442679762840271, 1.5583666563034058, 1.674053430557251, 1.7897403240203857, 1.9054272174835205, 2.0211141109466553, 2.13680100440979, 2.252487897872925]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 6.0, 1.0, 5.0, 6.0, 8.0, 10.0, 8.0, 17.0, 21.0, 13.0, 24.0, 40.0, 37.0, 30.0, 44.0, 48.0, 56.0, 49.0, 55.0, 47.0, 43.0, 50.0, 57.0, 60.0, 50.0, 32.0, 25.0, 32.0, 33.0, 19.0, 17.0, 14.0, 15.0, 3.0, 7.0, 7.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.053379058837891, -3.934798002243042, -3.8162171840667725, -3.697636127471924, -3.5790553092956543, -3.4604742527008057, -3.341893196105957, -3.2233123779296875, -3.104731321334839, -2.9861502647399902, -2.8675694465637207, -2.748988389968872, -2.6304073333740234, -2.511826515197754, -2.3932454586029053, -2.2746644020080566, -2.156083583831787, -2.0375025272369385, -1.918921709060669, -1.8003406524658203, -1.6817597150802612, -1.5631787776947021, -1.4445977210998535, -1.3260167837142944, -1.2074358463287354, -1.0888549089431763, -0.9702739119529724, -0.8516929149627686, -0.7331119775772095, -0.6145310401916504, -0.49595004320144653, -0.3773690462112427, -0.2587881088256836, -0.14020714163780212, -0.021626174449920654, 0.09695479273796082, 0.21553575992584229, 0.33411669731140137, 0.4526976943016052, 0.5712786912918091, 0.6898596286773682, 0.8084405660629272, 0.9270215630531311, 1.045602560043335, 1.164183497428894, 1.2827644348144531, 1.4013454914093018, 1.5199264287948608, 1.63850736618042, 1.757088303565979, 1.875669240951538, 1.9942502975463867, 2.1128311157226562, 2.231412172317505, 2.3499932289123535, 2.468574047088623, 2.5871551036834717, 2.7057361602783203, 2.82431697845459, 2.9428980350494385, 3.061479091644287, 3.1800599098205566, 3.2986409664154053, 3.417222023010254, 3.5358028411865234]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 6.0, 12.0, 17.0, 18.0, 20.0, 42.0, 84.0, 145.0, 288.0, 1039.0, 8329.0, 4170192.0, 12353.0, 1152.0, 320.0, 112.0, 55.0, 40.0, 18.0, 13.0, 5.0, 4.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.01171875, -2.94256591796875, -2.8734130859375, -2.80426025390625, -2.735107421875, -2.66595458984375, -2.5968017578125, -2.52764892578125, -2.45849609375, -2.38934326171875, -2.3201904296875, -2.25103759765625, -2.181884765625, -2.11273193359375, -2.0435791015625, -1.97442626953125, -1.9052734375, -1.83612060546875, -1.7669677734375, -1.69781494140625, -1.628662109375, -1.55950927734375, -1.4903564453125, -1.42120361328125, -1.35205078125, -1.28289794921875, -1.2137451171875, -1.14459228515625, -1.075439453125, -1.00628662109375, -0.9371337890625, -0.86798095703125, -0.798828125, -0.72967529296875, -0.6605224609375, -0.59136962890625, -0.522216796875, -0.45306396484375, -0.3839111328125, -0.31475830078125, -0.24560546875, -0.17645263671875, -0.1072998046875, -0.03814697265625, 0.031005859375, 0.10015869140625, 0.1693115234375, 0.23846435546875, 0.3076171875, 0.37677001953125, 0.4459228515625, 0.51507568359375, 0.584228515625, 0.65338134765625, 0.7225341796875, 0.79168701171875, 0.86083984375, 0.92999267578125, 0.9991455078125, 1.06829833984375, 1.137451171875, 1.20660400390625, 1.2757568359375, 1.34490966796875, 1.4140625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 9.0, 21.0, 75.0, 193.0, 306.0, 261.0, 79.0, 35.0, 8.0, 5.0, 6.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7294921875, -0.7127761840820312, -0.6960601806640625, -0.6793441772460938, -0.662628173828125, -0.6459121704101562, -0.6291961669921875, -0.6124801635742188, -0.59576416015625, -0.5790481567382812, -0.5623321533203125, -0.5456161499023438, -0.528900146484375, -0.5121841430664062, -0.4954681396484375, -0.47875213623046875, -0.4620361328125, -0.44532012939453125, -0.4286041259765625, -0.41188812255859375, -0.395172119140625, -0.37845611572265625, -0.3617401123046875, -0.34502410888671875, -0.32830810546875, -0.31159210205078125, -0.2948760986328125, -0.27816009521484375, -0.261444091796875, -0.24472808837890625, -0.2280120849609375, -0.21129608154296875, -0.194580078125, -0.17786407470703125, -0.1611480712890625, -0.14443206787109375, -0.127716064453125, -0.11100006103515625, -0.0942840576171875, -0.07756805419921875, -0.06085205078125, -0.04413604736328125, -0.0274200439453125, -0.01070404052734375, 0.006011962890625, 0.02272796630859375, 0.0394439697265625, 0.05615997314453125, 0.0728759765625, 0.08959197998046875, 0.1063079833984375, 0.12302398681640625, 0.139739990234375, 0.15645599365234375, 0.1731719970703125, 0.18988800048828125, 0.20660400390625, 0.22332000732421875, 0.2400360107421875, 0.25675201416015625, 0.273468017578125, 0.29018402099609375, 0.3069000244140625, 0.32361602783203125, 0.34033203125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 9.0, 2.0, 5.0, 7.0, 23.0, 45.0, 89.0, 302.0, 1170.0, 6840.0, 4122682.0, 59438.0, 2796.0, 513.0, 167.0, 93.0, 43.0, 22.0, 22.0, 8.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.634765625, -2.570159912109375, -2.50555419921875, -2.440948486328125, -2.3763427734375, -2.311737060546875, -2.24713134765625, -2.182525634765625, -2.117919921875, -2.053314208984375, -1.98870849609375, -1.924102783203125, -1.8594970703125, -1.794891357421875, -1.73028564453125, -1.665679931640625, -1.60107421875, -1.536468505859375, -1.47186279296875, -1.407257080078125, -1.3426513671875, -1.278045654296875, -1.21343994140625, -1.148834228515625, -1.084228515625, -1.019622802734375, -0.95501708984375, -0.890411376953125, -0.8258056640625, -0.761199951171875, -0.69659423828125, -0.631988525390625, -0.5673828125, -0.502777099609375, -0.43817138671875, -0.373565673828125, -0.3089599609375, -0.244354248046875, -0.17974853515625, -0.115142822265625, -0.050537109375, 0.014068603515625, 0.07867431640625, 0.143280029296875, 0.2078857421875, 0.272491455078125, 0.33709716796875, 0.401702880859375, 0.46630859375, 0.530914306640625, 0.59552001953125, 0.660125732421875, 0.7247314453125, 0.789337158203125, 0.85394287109375, 0.918548583984375, 0.983154296875, 1.047760009765625, 1.11236572265625, 1.176971435546875, 1.2415771484375, 1.306182861328125, 1.37078857421875, 1.435394287109375, 1.5]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 10.0, 17.0, 29.0, 91.0, 271.0, 3305.0, 228.0, 53.0, 29.0, 11.0, 9.0, 7.0, 2.0, 1.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.466552734375, -0.4466972351074219, -0.42684173583984375, -0.4069862365722656, -0.3871307373046875, -0.3672752380371094, -0.34741973876953125, -0.3275642395019531, -0.307708740234375, -0.2878532409667969, -0.26799774169921875, -0.24814224243164062, -0.2282867431640625, -0.20843124389648438, -0.18857574462890625, -0.16872024536132812, -0.14886474609375, -0.12900924682617188, -0.10915374755859375, -0.08929824829101562, -0.0694427490234375, -0.049587249755859375, -0.02973175048828125, -0.009876251220703125, 0.009979248046875, 0.029834747314453125, 0.04969024658203125, 0.06954574584960938, 0.0894012451171875, 0.10925674438476562, 0.12911224365234375, 0.14896774291992188, 0.1688232421875, 0.18867874145507812, 0.20853424072265625, 0.22838973999023438, 0.2482452392578125, 0.2681007385253906, 0.28795623779296875, 0.3078117370605469, 0.327667236328125, 0.3475227355957031, 0.36737823486328125, 0.3872337341308594, 0.4070892333984375, 0.4269447326660156, 0.44680023193359375, 0.4666557312011719, 0.48651123046875, 0.5063667297363281, 0.5262222290039062, 0.5460777282714844, 0.5659332275390625, 0.5857887268066406, 0.6056442260742188, 0.6254997253417969, 0.645355224609375, 0.6652107238769531, 0.6850662231445312, 0.7049217224121094, 0.7247772216796875, 0.7446327209472656, 0.7644882202148438, 0.7843437194824219, 0.80419921875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 2.0, 6.0, 10.0, 50.0, 431.0, 431.0, 50.0, 18.0, 8.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.220455169677734, -4.1127448081970215, -4.005034446716309, -3.8973240852355957, -3.789613723754883, -3.68190336227417, -3.574192762374878, -3.466482400894165, -3.358772039413452, -3.2510616779327393, -3.1433513164520264, -3.0356409549713135, -2.9279303550720215, -2.8202199935913086, -2.7125096321105957, -2.604799270629883, -2.49708890914917, -2.389378547668457, -2.281668186187744, -2.1739578247070312, -2.0662474632263184, -1.958536982536316, -1.8508265018463135, -1.7431161403656006, -1.6354057788848877, -1.5276954174041748, -1.419985055923462, -1.3122745752334595, -1.2045642137527466, -1.0968538522720337, -0.989143431186676, -0.8814330101013184, -0.7737228870391846, -0.6660125255584717, -0.558302104473114, -0.45059171319007874, -0.34288132190704346, -0.23517096042633057, -0.1274605393409729, -0.019750118255615234, 0.08796024322509766, 0.19567063450813293, 0.3033810257911682, 0.4110914170742035, 0.5188018083572388, 0.6265121698379517, 0.7342225909233093, 0.841933012008667, 0.9496433734893799, 1.0573537349700928, 1.1650640964508057, 1.272774577140808, 1.380484938621521, 1.4881953001022339, 1.5959057807922363, 1.7036161422729492, 1.811326503753662, 1.919036865234375, 2.026747226715088, 2.134457588195801, 2.2421679496765137, 2.3498783111572266, 2.4575889110565186, 2.5652992725372314, 2.6730096340179443]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 3.0, 4.0, 26.0, 33.0, 64.0, 95.0, 107.0, 133.0, 119.0, 110.0, 116.0, 75.0, 57.0, 27.0, 19.0, 7.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8339438438415527, -2.7609875202178955, -2.6880311965942383, -2.615074634552002, -2.5421183109283447, -2.4691619873046875, -2.3962056636810303, -2.323249340057373, -2.2502927780151367, -2.1773364543914795, -2.1043801307678223, -2.031423568725586, -1.9584672451019287, -1.8855109214782715, -1.8125545978546143, -1.7395981550216675, -1.6666418313980103, -1.593685507774353, -1.5207290649414062, -1.447772741317749, -1.3748162984848022, -1.301859974861145, -1.2289035320281982, -1.155947208404541, -1.0829908847808838, -1.0100345611572266, -0.9370781183242798, -0.8641217947006226, -0.7911653518676758, -0.7182090282440186, -0.6452526450157166, -0.5722962617874146, -0.4993398189544678, -0.42638343572616577, -0.35342705249786377, -0.28047069907188416, -0.20751431584358215, -0.13455793261528015, -0.06160157918930054, 0.011354804039001465, 0.08431118726730347, 0.15726757049560547, 0.23022393882274628, 0.3031803071498871, 0.3761366903781891, 0.4490930736064911, 0.5220494270324707, 0.5950058102607727, 0.6679621934890747, 0.7409185767173767, 0.8138749599456787, 0.8868312835693359, 0.9597877264022827, 1.03274405002594, 1.1057004928588867, 1.178656816482544, 1.2516131401062012, 1.3245694637298584, 1.3975259065628052, 1.4704822301864624, 1.5434386730194092, 1.6163949966430664, 1.6893513202667236, 1.7623077630996704, 1.8352642059326172]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 7.0, 8.0, 7.0, 18.0, 10.0, 14.0, 29.0, 24.0, 46.0, 53.0, 107.0, 169.0, 284.0, 542.0, 1012.0, 2544.0, 12164.0, 764936.0, 254048.0, 8391.0, 2125.0, 874.0, 437.0, 264.0, 142.0, 93.0, 52.0, 41.0, 27.0, 24.0, 13.0, 11.0, 7.0, 9.0, 5.0, 2.0, 4.0, 5.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.107421875, -2.0452728271484375, -1.983123779296875, -1.9209747314453125, -1.85882568359375, -1.7966766357421875, -1.734527587890625, -1.6723785400390625, -1.6102294921875, -1.5480804443359375, -1.485931396484375, -1.4237823486328125, -1.36163330078125, -1.2994842529296875, -1.237335205078125, -1.1751861572265625, -1.113037109375, -1.0508880615234375, -0.988739013671875, -0.9265899658203125, -0.86444091796875, -0.8022918701171875, -0.740142822265625, -0.6779937744140625, -0.6158447265625, -0.5536956787109375, -0.491546630859375, -0.4293975830078125, -0.36724853515625, -0.3050994873046875, -0.242950439453125, -0.1808013916015625, -0.11865234375, -0.0565032958984375, 0.005645751953125, 0.0677947998046875, 0.12994384765625, 0.1920928955078125, 0.254241943359375, 0.3163909912109375, 0.3785400390625, 0.4406890869140625, 0.502838134765625, 0.5649871826171875, 0.62713623046875, 0.6892852783203125, 0.751434326171875, 0.8135833740234375, 0.875732421875, 0.9378814697265625, 1.000030517578125, 1.0621795654296875, 1.12432861328125, 1.1864776611328125, 1.248626708984375, 1.3107757568359375, 1.3729248046875, 1.4350738525390625, 1.497222900390625, 1.5593719482421875, 1.62152099609375, 1.6836700439453125, 1.745819091796875, 1.8079681396484375, 1.8701171875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 10.0, 45.0, 115.0, 242.0, 314.0, 175.0, 56.0, 21.0, 9.0, 2.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70263671875, -0.6863784790039062, -0.6701202392578125, -0.6538619995117188, -0.637603759765625, -0.6213455200195312, -0.6050872802734375, -0.5888290405273438, -0.57257080078125, -0.5563125610351562, -0.5400543212890625, -0.5237960815429688, -0.507537841796875, -0.49127960205078125, -0.4750213623046875, -0.45876312255859375, -0.4425048828125, -0.42624664306640625, -0.4099884033203125, -0.39373016357421875, -0.377471923828125, -0.36121368408203125, -0.3449554443359375, -0.32869720458984375, -0.31243896484375, -0.29618072509765625, -0.2799224853515625, -0.26366424560546875, -0.247406005859375, -0.23114776611328125, -0.2148895263671875, -0.19863128662109375, -0.182373046875, -0.16611480712890625, -0.1498565673828125, -0.13359832763671875, -0.117340087890625, -0.10108184814453125, -0.0848236083984375, -0.06856536865234375, -0.05230712890625, -0.03604888916015625, -0.0197906494140625, -0.00353240966796875, 0.012725830078125, 0.02898406982421875, 0.0452423095703125, 0.06150054931640625, 0.0777587890625, 0.09401702880859375, 0.1102752685546875, 0.12653350830078125, 0.142791748046875, 0.15904998779296875, 0.1753082275390625, 0.19156646728515625, 0.20782470703125, 0.22408294677734375, 0.2403411865234375, 0.25659942626953125, 0.272857666015625, 0.28911590576171875, 0.3053741455078125, 0.32163238525390625, 0.337890625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 3.0, 12.0, 5.0, 11.0, 5.0, 16.0, 14.0, 15.0, 19.0, 23.0, 23.0, 43.0, 73.0, 120.0, 277.0, 863.0, 3136.0, 18032.0, 167766.0, 775208.0, 70466.0, 9394.0, 1907.0, 539.0, 201.0, 103.0, 56.0, 39.0, 19.0, 30.0, 21.0, 19.0, 17.0, 23.0, 9.0, 12.0, 7.0, 5.0, 7.0, 3.0, 5.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-1.1904296875, -1.1567306518554688, -1.1230316162109375, -1.0893325805664062, -1.055633544921875, -1.0219345092773438, -0.9882354736328125, -0.9545364379882812, -0.92083740234375, -0.8871383666992188, -0.8534393310546875, -0.8197402954101562, -0.786041259765625, -0.7523422241210938, -0.7186431884765625, -0.6849441528320312, -0.6512451171875, -0.6175460815429688, -0.5838470458984375, -0.5501480102539062, -0.516448974609375, -0.48274993896484375, -0.4490509033203125, -0.41535186767578125, -0.38165283203125, -0.34795379638671875, -0.3142547607421875, -0.28055572509765625, -0.246856689453125, -0.21315765380859375, -0.1794586181640625, -0.14575958251953125, -0.112060546875, -0.07836151123046875, -0.0446624755859375, -0.01096343994140625, 0.022735595703125, 0.05643463134765625, 0.0901336669921875, 0.12383270263671875, 0.15753173828125, 0.19123077392578125, 0.2249298095703125, 0.25862884521484375, 0.292327880859375, 0.32602691650390625, 0.3597259521484375, 0.39342498779296875, 0.4271240234375, 0.46082305908203125, 0.4945220947265625, 0.5282211303710938, 0.561920166015625, 0.5956192016601562, 0.6293182373046875, 0.6630172729492188, 0.69671630859375, 0.7304153442382812, 0.7641143798828125, 0.7978134155273438, 0.831512451171875, 0.8652114868164062, 0.8989105224609375, 0.9326095581054688, 0.96630859375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 3.0, 4.0, 8.0, 6.0, 8.0, 10.0, 13.0, 20.0, 15.0, 21.0, 28.0, 26.0, 15.0, 31.0, 37.0, 41.0, 35.0, 44.0, 37.0, 38.0, 45.0, 40.0, 56.0, 53.0, 44.0, 47.0, 37.0, 36.0, 37.0, 26.0, 22.0, 15.0, 22.0, 11.0, 17.0, 13.0, 7.0, 10.0, 7.0, 6.0, 6.0, 2.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.54296875, -0.5238113403320312, -0.5046539306640625, -0.48549652099609375, -0.466339111328125, -0.44718170166015625, -0.4280242919921875, -0.40886688232421875, -0.38970947265625, -0.37055206298828125, -0.3513946533203125, -0.33223724365234375, -0.313079833984375, -0.29392242431640625, -0.2747650146484375, -0.25560760498046875, -0.2364501953125, -0.21729278564453125, -0.1981353759765625, -0.17897796630859375, -0.159820556640625, -0.14066314697265625, -0.1215057373046875, -0.10234832763671875, -0.08319091796875, -0.06403350830078125, -0.0448760986328125, -0.02571868896484375, -0.006561279296875, 0.01259613037109375, 0.0317535400390625, 0.05091094970703125, 0.070068359375, 0.08922576904296875, 0.1083831787109375, 0.12754058837890625, 0.146697998046875, 0.16585540771484375, 0.1850128173828125, 0.20417022705078125, 0.22332763671875, 0.24248504638671875, 0.2616424560546875, 0.28079986572265625, 0.299957275390625, 0.31911468505859375, 0.3382720947265625, 0.35742950439453125, 0.3765869140625, 0.39574432373046875, 0.4149017333984375, 0.43405914306640625, 0.453216552734375, 0.47237396240234375, 0.4915313720703125, 0.5106887817382812, 0.52984619140625, 0.5490036010742188, 0.5681610107421875, 0.5873184204101562, 0.606475830078125, 0.6256332397460938, 0.6447906494140625, 0.6639480590820312, 0.68310546875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 8.0, 8.0, 15.0, 19.0, 23.0, 53.0, 70.0, 122.0, 285.0, 551.0, 1077.0, 2355.0, 6812.0, 30985.0, 669660.0, 307677.0, 19897.0, 5109.0, 1984.0, 870.0, 386.0, 225.0, 104.0, 76.0, 50.0, 36.0, 23.0, 26.0, 8.0, 7.0, 5.0, 6.0, 2.0, 4.0, 6.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.250244140625, -0.24158096313476562, -0.23291778564453125, -0.22425460815429688, -0.2155914306640625, -0.20692825317382812, -0.19826507568359375, -0.18960189819335938, -0.180938720703125, -0.17227554321289062, -0.16361236572265625, -0.15494918823242188, -0.1462860107421875, -0.13762283325195312, -0.12895965576171875, -0.12029647827148438, -0.11163330078125, -0.10297012329101562, -0.09430694580078125, -0.08564376831054688, -0.0769805908203125, -0.06831741333007812, -0.05965423583984375, -0.050991058349609375, -0.042327880859375, -0.033664703369140625, -0.02500152587890625, -0.016338348388671875, -0.0076751708984375, 0.000988006591796875, 0.00965118408203125, 0.018314361572265625, 0.0269775390625, 0.035640716552734375, 0.04430389404296875, 0.052967071533203125, 0.0616302490234375, 0.07029342651367188, 0.07895660400390625, 0.08761978149414062, 0.096282958984375, 0.10494613647460938, 0.11360931396484375, 0.12227249145507812, 0.1309356689453125, 0.13959884643554688, 0.14826202392578125, 0.15692520141601562, 0.16558837890625, 0.17425155639648438, 0.18291473388671875, 0.19157791137695312, 0.2002410888671875, 0.20890426635742188, 0.21756744384765625, 0.22623062133789062, 0.234893798828125, 0.24355697631835938, 0.25222015380859375, 0.2608833312988281, 0.2695465087890625, 0.2782096862792969, 0.28687286376953125, 0.2955360412597656, 0.30419921875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 5.0, 11.0, 13.0, 48.0, 72.0, 134.0, 258.0, 220.0, 132.0, 49.0, 30.0, 11.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.910064697265625e-05, -3.7913210690021515e-05, -3.672577440738678e-05, -3.5538338124752045e-05, -3.435090184211731e-05, -3.3163465559482574e-05, -3.197602927684784e-05, -3.0788592994213104e-05, -2.960115671157837e-05, -2.8413720428943634e-05, -2.72262841463089e-05, -2.6038847863674164e-05, -2.485141158103943e-05, -2.3663975298404694e-05, -2.247653901576996e-05, -2.1289102733135223e-05, -2.0101666450500488e-05, -1.8914230167865753e-05, -1.7726793885231018e-05, -1.6539357602596283e-05, -1.5351921319961548e-05, -1.4164485037326813e-05, -1.2977048754692078e-05, -1.1789612472057343e-05, -1.0602176189422607e-05, -9.414739906787872e-06, -8.227303624153137e-06, -7.039867341518402e-06, -5.852431058883667e-06, -4.664994776248932e-06, -3.4775584936141968e-06, -2.2901222109794617e-06, -1.1026859283447266e-06, 8.475035429000854e-08, 1.2721866369247437e-06, 2.4596229195594788e-06, 3.647059202194214e-06, 4.834495484828949e-06, 6.021931767463684e-06, 7.209368050098419e-06, 8.396804332733154e-06, 9.58424061536789e-06, 1.0771676898002625e-05, 1.195911318063736e-05, 1.3146549463272095e-05, 1.433398574590683e-05, 1.5521422028541565e-05, 1.67088583111763e-05, 1.7896294593811035e-05, 1.908373087644577e-05, 2.0271167159080505e-05, 2.145860344171524e-05, 2.2646039724349976e-05, 2.383347600698471e-05, 2.5020912289619446e-05, 2.620834857225418e-05, 2.7395784854888916e-05, 2.858322113752365e-05, 2.9770657420158386e-05, 3.095809370279312e-05, 3.2145529985427856e-05, 3.333296626806259e-05, 3.452040255069733e-05, 3.570783883333206e-05, 3.68952751159668e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 5.0, 7.0, 7.0, 16.0, 28.0, 53.0, 130.0, 386.0, 1778.0, 26249.0, 999757.0, 18079.0, 1482.0, 367.0, 110.0, 48.0, 21.0, 9.0, 9.0, 7.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7021484375, -0.680511474609375, -0.65887451171875, -0.637237548828125, -0.6156005859375, -0.593963623046875, -0.57232666015625, -0.550689697265625, -0.529052734375, -0.507415771484375, -0.48577880859375, -0.464141845703125, -0.4425048828125, -0.420867919921875, -0.39923095703125, -0.377593994140625, -0.35595703125, -0.334320068359375, -0.31268310546875, -0.291046142578125, -0.2694091796875, -0.247772216796875, -0.22613525390625, -0.204498291015625, -0.182861328125, -0.161224365234375, -0.13958740234375, -0.117950439453125, -0.0963134765625, -0.074676513671875, -0.05303955078125, -0.031402587890625, -0.009765625, 0.011871337890625, 0.03350830078125, 0.055145263671875, 0.0767822265625, 0.098419189453125, 0.12005615234375, 0.141693115234375, 0.163330078125, 0.184967041015625, 0.20660400390625, 0.228240966796875, 0.2498779296875, 0.271514892578125, 0.29315185546875, 0.314788818359375, 0.33642578125, 0.358062744140625, 0.37969970703125, 0.401336669921875, 0.4229736328125, 0.444610595703125, 0.46624755859375, 0.487884521484375, 0.509521484375, 0.531158447265625, 0.55279541015625, 0.574432373046875, 0.5960693359375, 0.617706298828125, 0.63934326171875, 0.660980224609375, 0.6826171875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 8.0, 5.0, 3.0, 10.0, 9.0, 18.0, 50.0, 88.0, 167.0, 236.0, 163.0, 99.0, 54.0, 41.0, 18.0, 11.0, 8.0, 4.0, 7.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.368408203125, -0.3567466735839844, -0.34508514404296875, -0.3334236145019531, -0.3217620849609375, -0.3101005554199219, -0.29843902587890625, -0.2867774963378906, -0.275115966796875, -0.2634544372558594, -0.25179290771484375, -0.24013137817382812, -0.2284698486328125, -0.21680831909179688, -0.20514678955078125, -0.19348526000976562, -0.18182373046875, -0.17016220092773438, -0.15850067138671875, -0.14683914184570312, -0.1351776123046875, -0.12351608276367188, -0.11185455322265625, -0.10019302368164062, -0.088531494140625, -0.07686996459960938, -0.06520843505859375, -0.053546905517578125, -0.0418853759765625, -0.030223846435546875, -0.01856231689453125, -0.006900787353515625, 0.0047607421875, 0.016422271728515625, 0.02808380126953125, 0.039745330810546875, 0.0514068603515625, 0.06306838989257812, 0.07472991943359375, 0.08639144897460938, 0.098052978515625, 0.10971450805664062, 0.12137603759765625, 0.13303756713867188, 0.1446990966796875, 0.15636062622070312, 0.16802215576171875, 0.17968368530273438, 0.19134521484375, 0.20300674438476562, 0.21466827392578125, 0.22632980346679688, 0.2379913330078125, 0.24965286254882812, 0.26131439208984375, 0.2729759216308594, 0.284637451171875, 0.2962989807128906, 0.30796051025390625, 0.3196220397949219, 0.3312835693359375, 0.3429450988769531, 0.35460662841796875, 0.3662681579589844, 0.3779296875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 6.0, 20.0, 52.0, 160.0, 442.0, 200.0, 79.0, 23.0, 17.0, 1.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.938676834106445, -5.698006629943848, -5.45733642578125, -5.216666221618652, -4.975996017456055, -4.735325813293457, -4.494655609130859, -4.253985404968262, -4.013315200805664, -3.7726449966430664, -3.5319747924804688, -3.291304588317871, -3.0506343841552734, -2.809964179992676, -2.5692942142486572, -2.3286240100860596, -2.087954044342041, -1.8472838401794434, -1.6066136360168457, -1.3659435510635376, -1.12527334690094, -0.8846031427383423, -0.6439330577850342, -0.4032628536224365, -0.16259264945983887, 0.0780775249004364, 0.31874769926071167, 0.5594178438186646, 0.8000880479812622, 1.0407582521438599, 1.281428337097168, 1.5220985412597656, 1.7627687454223633, 2.003438949584961, 2.2441091537475586, 2.4847793579101562, 2.725449562072754, 2.9661197662353516, 3.20678973197937, 3.4474599361419678, 3.6881301403045654, 3.928800344467163, 4.169470310211182, 4.410140514373779, 4.650810718536377, 4.891480922698975, 5.132151126861572, 5.37282133102417, 5.613491535186768, 5.854161739349365, 6.094831943511963, 6.3355021476745605, 6.576172351837158, 6.816842555999756, 7.057512283325195, 7.298182487487793, 7.538852691650391, 7.779522895812988, 8.020193099975586, 8.260863304138184, 8.501533508300781, 8.742203712463379, 8.982873916625977, 9.223544120788574, 9.464214324951172]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 7.0, 9.0, 14.0, 15.0, 15.0, 21.0, 22.0, 31.0, 37.0, 34.0, 57.0, 60.0, 62.0, 65.0, 84.0, 69.0, 51.0, 66.0, 61.0, 47.0, 44.0, 25.0, 33.0, 20.0, 15.0, 15.0, 8.0, 6.0, 2.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.111644744873047, -3.957146167755127, -3.802647590637207, -3.648149013519287, -3.493650197982788, -3.339151620864868, -3.1846530437469482, -3.030154228210449, -2.8756556510925293, -2.7211570739746094, -2.5666584968566895, -2.4121599197387695, -2.2576611042022705, -2.1031625270843506, -1.9486639499664307, -1.7941652536392212, -1.6396667957305908, -1.485168218612671, -1.3306695222854614, -1.1761709451675415, -1.021672248840332, -0.8671736717224121, -0.7126750946044922, -0.5581763982772827, -0.4036778211593628, -0.2491791993379593, -0.09468057751655579, 0.05981802940368652, 0.21431666612625122, 0.3688153028488159, 0.5233138799667358, 0.6778125762939453, 0.8323111534118652, 0.9868097901344299, 1.1413084268569946, 1.2958070039749146, 1.450305700302124, 1.604804277420044, 1.7593028545379639, 1.9138015508651733, 2.068300247192383, 2.2227988243103027, 2.3772974014282227, 2.5317959785461426, 2.6862947940826416, 2.8407933712005615, 2.9952919483184814, 3.1497907638549805, 3.3042891025543213, 3.458787679672241, 3.613286256790161, 3.76778507232666, 3.92228364944458, 4.0767822265625, 4.23128080368042, 4.38577938079834, 4.54027795791626, 4.69477653503418, 4.8492751121521, 5.0037736892700195, 5.1582722663879395, 5.312770843505859, 5.4672698974609375, 5.621768474578857, 5.776267051696777]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 5.0, 7.0, 10.0, 22.0, 42.0, 150.0, 643.0, 302639.0, 3889996.0, 546.0, 130.0, 45.0, 15.0, 9.0, 8.0, 4.0, 4.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.17578125, -6.032196044921875, -5.88861083984375, -5.745025634765625, -5.6014404296875, -5.457855224609375, -5.31427001953125, -5.170684814453125, -5.027099609375, -4.883514404296875, -4.73992919921875, -4.596343994140625, -4.4527587890625, -4.309173583984375, -4.16558837890625, -4.022003173828125, -3.87841796875, -3.734832763671875, -3.59124755859375, -3.447662353515625, -3.3040771484375, -3.160491943359375, -3.01690673828125, -2.873321533203125, -2.729736328125, -2.586151123046875, -2.44256591796875, -2.298980712890625, -2.1553955078125, -2.011810302734375, -1.86822509765625, -1.724639892578125, -1.5810546875, -1.437469482421875, -1.29388427734375, -1.150299072265625, -1.0067138671875, -0.863128662109375, -0.71954345703125, -0.575958251953125, -0.432373046875, -0.288787841796875, -0.14520263671875, -0.001617431640625, 0.1419677734375, 0.285552978515625, 0.42913818359375, 0.572723388671875, 0.71630859375, 0.859893798828125, 1.00347900390625, 1.147064208984375, 1.2906494140625, 1.434234619140625, 1.57781982421875, 1.721405029296875, 1.864990234375, 2.008575439453125, 2.15216064453125, 2.295745849609375, 2.4393310546875, 2.582916259765625, 2.72650146484375, 2.870086669921875, 3.013671875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 6.0, 15.0, 36.0, 115.0, 197.0, 290.0, 207.0, 79.0, 33.0, 12.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.71630859375, -0.6998023986816406, -0.6832962036132812, -0.6667900085449219, -0.6502838134765625, -0.6337776184082031, -0.6172714233398438, -0.6007652282714844, -0.584259033203125, -0.5677528381347656, -0.5512466430664062, -0.5347404479980469, -0.5182342529296875, -0.5017280578613281, -0.48522186279296875, -0.4687156677246094, -0.45220947265625, -0.4357032775878906, -0.41919708251953125, -0.4026908874511719, -0.3861846923828125, -0.3696784973144531, -0.35317230224609375, -0.3366661071777344, -0.320159912109375, -0.3036537170410156, -0.28714752197265625, -0.2706413269042969, -0.2541351318359375, -0.23762893676757812, -0.22112274169921875, -0.20461654663085938, -0.1881103515625, -0.17160415649414062, -0.15509796142578125, -0.13859176635742188, -0.1220855712890625, -0.10557937622070312, -0.08907318115234375, -0.07256698608398438, -0.056060791015625, -0.039554595947265625, -0.02304840087890625, -0.006542205810546875, 0.0099639892578125, 0.026470184326171875, 0.04297637939453125, 0.059482574462890625, 0.07598876953125, 0.09249496459960938, 0.10900115966796875, 0.12550735473632812, 0.1420135498046875, 0.15851974487304688, 0.17502593994140625, 0.19153213500976562, 0.208038330078125, 0.22454452514648438, 0.24105072021484375, 0.2575569152832031, 0.2740631103515625, 0.2905693054199219, 0.30707550048828125, 0.3235816955566406, 0.340087890625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 7.0, 5.0, 9.0, 17.0, 37.0, 48.0, 114.0, 188.0, 458.0, 1188.0, 4644.0, 32358.0, 4081709.0, 64205.0, 6761.0, 1619.0, 504.0, 202.0, 112.0, 45.0, 21.0, 9.0, 11.0, 6.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58740234375, -0.5614242553710938, -0.5354461669921875, -0.5094680786132812, -0.483489990234375, -0.45751190185546875, -0.4315338134765625, -0.40555572509765625, -0.37957763671875, -0.35359954833984375, -0.3276214599609375, -0.30164337158203125, -0.275665283203125, -0.24968719482421875, -0.2237091064453125, -0.19773101806640625, -0.1717529296875, -0.14577484130859375, -0.1197967529296875, -0.09381866455078125, -0.067840576171875, -0.04186248779296875, -0.0158843994140625, 0.01009368896484375, 0.03607177734375, 0.06204986572265625, 0.0880279541015625, 0.11400604248046875, 0.139984130859375, 0.16596221923828125, 0.1919403076171875, 0.21791839599609375, 0.243896484375, 0.26987457275390625, 0.2958526611328125, 0.32183074951171875, 0.347808837890625, 0.37378692626953125, 0.3997650146484375, 0.42574310302734375, 0.45172119140625, 0.47769927978515625, 0.5036773681640625, 0.5296554565429688, 0.555633544921875, 0.5816116333007812, 0.6075897216796875, 0.6335678100585938, 0.6595458984375, 0.6855239868164062, 0.7115020751953125, 0.7374801635742188, 0.763458251953125, 0.7894363403320312, 0.8154144287109375, 0.8413925170898438, 0.86737060546875, 0.8933486938476562, 0.9193267822265625, 0.9453048706054688, 0.971282958984375, 0.9972610473632812, 1.0232391357421875, 1.0492172241210938, 1.0751953125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 6.0, 8.0, 14.0, 22.0, 48.0, 122.0, 497.0, 3038.0, 175.0, 44.0, 23.0, 23.0, 19.0, 8.0, 3.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.318115234375, -0.3095703125, -0.301025390625, -0.29248046875, -0.283935546875, -0.275390625, -0.266845703125, -0.25830078125, -0.249755859375, -0.2412109375, -0.232666015625, -0.22412109375, -0.215576171875, -0.20703125, -0.198486328125, -0.18994140625, -0.181396484375, -0.1728515625, -0.164306640625, -0.15576171875, -0.147216796875, -0.138671875, -0.130126953125, -0.12158203125, -0.113037109375, -0.1044921875, -0.095947265625, -0.08740234375, -0.078857421875, -0.0703125, -0.061767578125, -0.05322265625, -0.044677734375, -0.0361328125, -0.027587890625, -0.01904296875, -0.010498046875, -0.001953125, 0.006591796875, 0.01513671875, 0.023681640625, 0.0322265625, 0.040771484375, 0.04931640625, 0.057861328125, 0.06640625, 0.074951171875, 0.08349609375, 0.092041015625, 0.1005859375, 0.109130859375, 0.11767578125, 0.126220703125, 0.134765625, 0.143310546875, 0.15185546875, 0.160400390625, 0.1689453125, 0.177490234375, 0.18603515625, 0.194580078125, 0.203125, 0.211669921875, 0.22021484375, 0.228759765625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 7.0, 33.0, 147.0, 533.0, 241.0, 41.0, 6.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.640495777130127, -3.567335605621338, -3.494175434112549, -3.4210152626037598, -3.3478550910949707, -3.2746951580047607, -3.2015349864959717, -3.1283748149871826, -3.0552146434783936, -2.9820544719696045, -2.9088943004608154, -2.8357341289520264, -2.7625741958618164, -2.6894140243530273, -2.6162538528442383, -2.543093681335449, -2.46993350982666, -2.396773338317871, -2.323613166809082, -2.250452995300293, -2.177292823791504, -2.104132890701294, -2.030972719192505, -1.9578125476837158, -1.8846523761749268, -1.8114922046661377, -1.7383320331573486, -1.6651719808578491, -1.59201180934906, -1.518851637840271, -1.4456915855407715, -1.3725314140319824, -1.2993710041046143, -1.2262108325958252, -1.1530506610870361, -1.0798906087875366, -1.0067304372787476, -0.9335702657699585, -0.8604101538658142, -0.7872500419616699, -0.7140898704528809, -0.6409296989440918, -0.5677695870399475, -0.49460944533348083, -0.42144930362701416, -0.3482891619205475, -0.2751290202140808, -0.20196890830993652, -0.12880873680114746, -0.055648595094680786, 0.01751154661178589, 0.09067168831825256, 0.16383183002471924, 0.2369919717311859, 0.3101521134376526, 0.3833122253417969, 0.45647239685058594, 0.529632568359375, 0.6027926802635193, 0.6759527921676636, 0.7491129636764526, 0.8222731351852417, 0.895433247089386, 0.9685933589935303, 1.0417535305023193]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 2.0, 5.0, 7.0, 11.0, 18.0, 15.0, 29.0, 32.0, 26.0, 44.0, 64.0, 55.0, 60.0, 50.0, 48.0, 51.0, 69.0, 51.0, 56.0, 64.0, 48.0, 40.0, 40.0, 30.0, 32.0, 18.0, 10.0, 12.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8985940217971802, -0.8755716681480408, -0.8525493144989014, -0.8295270204544067, -0.8065046668052673, -0.7834823131561279, -0.7604599595069885, -0.7374376058578491, -0.7144153118133545, -0.6913929581642151, -0.6683706045150757, -0.645348310470581, -0.6223259568214417, -0.5993036031723022, -0.5762812495231628, -0.5532588958740234, -0.530236542224884, -0.5072141885757446, -0.4841918647289276, -0.4611695110797882, -0.4381471872329712, -0.4151248335838318, -0.3921024799346924, -0.369080126285553, -0.34605780243873596, -0.32303544878959656, -0.30001312494277954, -0.27699077129364014, -0.25396841764450073, -0.23094609379768372, -0.2079237401485443, -0.1849014014005661, -0.16187900304794312, -0.1388566642999649, -0.1158343181014061, -0.09281197190284729, -0.06978963315486908, -0.04676729440689087, -0.023744940757751465, -0.0007226020097732544, 0.022299736738204956, 0.045322079211473465, 0.06834442168474197, 0.09136676788330078, 0.11438910663127899, 0.1374114453792572, 0.1604337990283966, 0.18345613777637482, 0.20647847652435303, 0.22950081527233124, 0.25252315402030945, 0.27554550766944885, 0.29856783151626587, 0.3215901851654053, 0.3446125388145447, 0.3676348924636841, 0.3906572163105011, 0.4136795699596405, 0.4367018938064575, 0.4597242474555969, 0.48274660110473633, 0.505768895149231, 0.5287913084030151, 0.5518136024475098, 0.5748359560966492]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 6.0, 4.0, 7.0, 17.0, 12.0, 19.0, 30.0, 46.0, 64.0, 72.0, 123.0, 246.0, 477.0, 1053.0, 2690.0, 14797.0, 835382.0, 182714.0, 7199.0, 1906.0, 772.0, 389.0, 192.0, 109.0, 55.0, 33.0, 46.0, 23.0, 21.0, 13.0, 14.0, 6.0, 7.0, 8.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.189453125, -2.122772216796875, -2.05609130859375, -1.989410400390625, -1.9227294921875, -1.856048583984375, -1.78936767578125, -1.722686767578125, -1.656005859375, -1.589324951171875, -1.52264404296875, -1.455963134765625, -1.3892822265625, -1.322601318359375, -1.25592041015625, -1.189239501953125, -1.12255859375, -1.055877685546875, -0.98919677734375, -0.922515869140625, -0.8558349609375, -0.789154052734375, -0.72247314453125, -0.655792236328125, -0.589111328125, -0.522430419921875, -0.45574951171875, -0.389068603515625, -0.3223876953125, -0.255706787109375, -0.18902587890625, -0.122344970703125, -0.0556640625, 0.011016845703125, 0.07769775390625, 0.144378662109375, 0.2110595703125, 0.277740478515625, 0.34442138671875, 0.411102294921875, 0.477783203125, 0.544464111328125, 0.61114501953125, 0.677825927734375, 0.7445068359375, 0.811187744140625, 0.87786865234375, 0.944549560546875, 1.01123046875, 1.077911376953125, 1.14459228515625, 1.211273193359375, 1.2779541015625, 1.344635009765625, 1.41131591796875, 1.477996826171875, 1.544677734375, 1.611358642578125, 1.67803955078125, 1.744720458984375, 1.8114013671875, 1.878082275390625, 1.94476318359375, 2.011444091796875, 2.078125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 9.0, 16.0, 44.0, 125.0, 229.0, 258.0, 196.0, 71.0, 35.0, 8.0, 3.0, 5.0, 2.0, 0.0, 4.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7109375, -0.6945114135742188, -0.6780853271484375, -0.6616592407226562, -0.645233154296875, -0.6288070678710938, -0.6123809814453125, -0.5959548950195312, -0.57952880859375, -0.5631027221679688, -0.5466766357421875, -0.5302505493164062, -0.513824462890625, -0.49739837646484375, -0.4809722900390625, -0.46454620361328125, -0.4481201171875, -0.43169403076171875, -0.4152679443359375, -0.39884185791015625, -0.382415771484375, -0.36598968505859375, -0.3495635986328125, -0.33313751220703125, -0.31671142578125, -0.30028533935546875, -0.2838592529296875, -0.26743316650390625, -0.251007080078125, -0.23458099365234375, -0.2181549072265625, -0.20172882080078125, -0.185302734375, -0.16887664794921875, -0.1524505615234375, -0.13602447509765625, -0.119598388671875, -0.10317230224609375, -0.0867462158203125, -0.07032012939453125, -0.05389404296875, -0.03746795654296875, -0.0210418701171875, -0.00461578369140625, 0.011810302734375, 0.02823638916015625, 0.0446624755859375, 0.06108856201171875, 0.0775146484375, 0.09394073486328125, 0.1103668212890625, 0.12679290771484375, 0.143218994140625, 0.15964508056640625, 0.1760711669921875, 0.19249725341796875, 0.20892333984375, 0.22534942626953125, 0.2417755126953125, 0.25820159912109375, 0.274627685546875, 0.29105377197265625, 0.3074798583984375, 0.32390594482421875, 0.34033203125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 5.0, 3.0, 8.0, 12.0, 12.0, 15.0, 22.0, 25.0, 27.0, 25.0, 50.0, 52.0, 115.0, 255.0, 737.0, 2519.0, 13124.0, 110679.0, 804216.0, 100729.0, 12228.0, 2378.0, 682.0, 252.0, 121.0, 56.0, 48.0, 29.0, 23.0, 23.0, 17.0, 12.0, 15.0, 9.0, 9.0, 4.0, 3.0, 5.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2626953125, -1.22607421875, -1.189453125, -1.15283203125, -1.1162109375, -1.07958984375, -1.04296875, -1.00634765625, -0.9697265625, -0.93310546875, -0.896484375, -0.85986328125, -0.8232421875, -0.78662109375, -0.75, -0.71337890625, -0.6767578125, -0.64013671875, -0.603515625, -0.56689453125, -0.5302734375, -0.49365234375, -0.45703125, -0.42041015625, -0.3837890625, -0.34716796875, -0.310546875, -0.27392578125, -0.2373046875, -0.20068359375, -0.1640625, -0.12744140625, -0.0908203125, -0.05419921875, -0.017578125, 0.01904296875, 0.0556640625, 0.09228515625, 0.12890625, 0.16552734375, 0.2021484375, 0.23876953125, 0.275390625, 0.31201171875, 0.3486328125, 0.38525390625, 0.421875, 0.45849609375, 0.4951171875, 0.53173828125, 0.568359375, 0.60498046875, 0.6416015625, 0.67822265625, 0.71484375, 0.75146484375, 0.7880859375, 0.82470703125, 0.861328125, 0.89794921875, 0.9345703125, 0.97119140625, 1.0078125, 1.04443359375, 1.0810546875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 3.0, 1.0, 3.0, 5.0, 7.0, 5.0, 10.0, 16.0, 11.0, 19.0, 21.0, 22.0, 27.0, 35.0, 34.0, 37.0, 36.0, 41.0, 44.0, 54.0, 44.0, 56.0, 56.0, 48.0, 52.0, 31.0, 44.0, 33.0, 32.0, 31.0, 17.0, 35.0, 17.0, 17.0, 16.0, 13.0, 8.0, 9.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6220703125, -0.6008453369140625, -0.579620361328125, -0.5583953857421875, -0.53717041015625, -0.5159454345703125, -0.494720458984375, -0.4734954833984375, -0.4522705078125, -0.4310455322265625, -0.409820556640625, -0.3885955810546875, -0.36737060546875, -0.3461456298828125, -0.324920654296875, -0.3036956787109375, -0.282470703125, -0.2612457275390625, -0.240020751953125, -0.2187957763671875, -0.19757080078125, -0.1763458251953125, -0.155120849609375, -0.1338958740234375, -0.1126708984375, -0.0914459228515625, -0.070220947265625, -0.0489959716796875, -0.02777099609375, -0.0065460205078125, 0.014678955078125, 0.0359039306640625, 0.05712890625, 0.0783538818359375, 0.099578857421875, 0.1208038330078125, 0.14202880859375, 0.1632537841796875, 0.184478759765625, 0.2057037353515625, 0.2269287109375, 0.2481536865234375, 0.269378662109375, 0.2906036376953125, 0.31182861328125, 0.3330535888671875, 0.354278564453125, 0.3755035400390625, 0.396728515625, 0.4179534912109375, 0.439178466796875, 0.4604034423828125, 0.48162841796875, 0.5028533935546875, 0.524078369140625, 0.5453033447265625, 0.5665283203125, 0.5877532958984375, 0.608978271484375, 0.6302032470703125, 0.65142822265625, 0.6726531982421875, 0.693878173828125, 0.7151031494140625, 0.736328125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 12.0, 8.0, 18.0, 22.0, 37.0, 52.0, 78.0, 158.0, 244.0, 533.0, 1176.0, 3359.0, 13484.0, 92631.0, 770763.0, 141505.0, 17625.0, 4168.0, 1396.0, 577.0, 291.0, 139.0, 102.0, 64.0, 32.0, 31.0, 13.0, 7.0, 8.0, 8.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2410888671875, -0.23320579528808594, -0.22532272338867188, -0.2174396514892578, -0.20955657958984375, -0.2016735076904297, -0.19379043579101562, -0.18590736389160156, -0.1780242919921875, -0.17014122009277344, -0.16225814819335938, -0.1543750762939453, -0.14649200439453125, -0.1386089324951172, -0.13072586059570312, -0.12284278869628906, -0.114959716796875, -0.10707664489746094, -0.09919357299804688, -0.09131050109863281, -0.08342742919921875, -0.07554435729980469, -0.06766128540039062, -0.05977821350097656, -0.0518951416015625, -0.04401206970214844, -0.036128997802734375, -0.028245925903320312, -0.02036285400390625, -0.012479782104492188, -0.004596710205078125, 0.0032863616943359375, 0.01116943359375, 0.019052505493164062, 0.026935577392578125, 0.03481864929199219, 0.04270172119140625, 0.05058479309082031, 0.058467864990234375, 0.06635093688964844, 0.0742340087890625, 0.08211708068847656, 0.09000015258789062, 0.09788322448730469, 0.10576629638671875, 0.11364936828613281, 0.12153244018554688, 0.12941551208496094, 0.137298583984375, 0.14518165588378906, 0.15306472778320312, 0.1609477996826172, 0.16883087158203125, 0.1767139434814453, 0.18459701538085938, 0.19248008728027344, 0.2003631591796875, 0.20824623107910156, 0.21612930297851562, 0.2240123748779297, 0.23189544677734375, 0.2397785186767578, 0.24766159057617188, 0.25554466247558594, 0.263427734375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 10.0, 12.0, 7.0, 15.0, 33.0, 35.0, 53.0, 88.0, 112.0, 161.0, 118.0, 124.0, 89.0, 57.0, 30.0, 22.0, 11.0, 9.0, 11.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0], "bins": [-4.297494888305664e-05, -4.209205508232117e-05, -4.120916128158569e-05, -4.032626748085022e-05, -3.9443373680114746e-05, -3.856047987937927e-05, -3.76775860786438e-05, -3.6794692277908325e-05, -3.591179847717285e-05, -3.502890467643738e-05, -3.4146010875701904e-05, -3.326311707496643e-05, -3.238022327423096e-05, -3.1497329473495483e-05, -3.061443567276001e-05, -2.9731541872024536e-05, -2.8848648071289062e-05, -2.796575427055359e-05, -2.7082860469818115e-05, -2.619996666908264e-05, -2.5317072868347168e-05, -2.4434179067611694e-05, -2.355128526687622e-05, -2.2668391466140747e-05, -2.1785497665405273e-05, -2.09026038646698e-05, -2.0019710063934326e-05, -1.9136816263198853e-05, -1.825392246246338e-05, -1.7371028661727905e-05, -1.648813486099243e-05, -1.5605241060256958e-05, -1.4722347259521484e-05, -1.383945345878601e-05, -1.2956559658050537e-05, -1.2073665857315063e-05, -1.119077205657959e-05, -1.0307878255844116e-05, -9.424984455108643e-06, -8.542090654373169e-06, -7.659196853637695e-06, -6.776303052902222e-06, -5.893409252166748e-06, -5.010515451431274e-06, -4.127621650695801e-06, -3.244727849960327e-06, -2.3618340492248535e-06, -1.4789402484893799e-06, -5.960464477539062e-07, 2.868473529815674e-07, 1.169741153717041e-06, 2.0526349544525146e-06, 2.9355287551879883e-06, 3.818422555923462e-06, 4.7013163566589355e-06, 5.584210157394409e-06, 6.467103958129883e-06, 7.3499977588653564e-06, 8.23289155960083e-06, 9.115785360336304e-06, 9.998679161071777e-06, 1.0881572961807251e-05, 1.1764466762542725e-05, 1.2647360563278198e-05, 1.3530254364013672e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 2.0, 5.0, 11.0, 2.0, 11.0, 6.0, 12.0, 15.0, 12.0, 23.0, 42.0, 71.0, 111.0, 282.0, 625.0, 2113.0, 10111.0, 83117.0, 840726.0, 96757.0, 10901.0, 2323.0, 673.0, 251.0, 123.0, 69.0, 36.0, 20.0, 23.0, 19.0, 12.0, 12.0, 8.0, 4.0, 5.0, 3.0, 4.0, 3.0, 1.0, 2.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26513671875, -0.25615692138671875, -0.2471771240234375, -0.23819732666015625, -0.229217529296875, -0.22023773193359375, -0.2112579345703125, -0.20227813720703125, -0.19329833984375, -0.18431854248046875, -0.1753387451171875, -0.16635894775390625, -0.157379150390625, -0.14839935302734375, -0.1394195556640625, -0.13043975830078125, -0.1214599609375, -0.11248016357421875, -0.1035003662109375, -0.09452056884765625, -0.085540771484375, -0.07656097412109375, -0.0675811767578125, -0.05860137939453125, -0.04962158203125, -0.04064178466796875, -0.0316619873046875, -0.02268218994140625, -0.013702392578125, -0.00472259521484375, 0.0042572021484375, 0.01323699951171875, 0.022216796875, 0.03119659423828125, 0.0401763916015625, 0.04915618896484375, 0.058135986328125, 0.06711578369140625, 0.0760955810546875, 0.08507537841796875, 0.09405517578125, 0.10303497314453125, 0.1120147705078125, 0.12099456787109375, 0.129974365234375, 0.13895416259765625, 0.1479339599609375, 0.15691375732421875, 0.1658935546875, 0.17487335205078125, 0.1838531494140625, 0.19283294677734375, 0.201812744140625, 0.21079254150390625, 0.2197723388671875, 0.22875213623046875, 0.23773193359375, 0.24671173095703125, 0.2556915283203125, 0.26467132568359375, 0.273651123046875, 0.28263092041015625, 0.2916107177734375, 0.30059051513671875, 0.3095703125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 5.0, 6.0, 6.0, 5.0, 5.0, 8.0, 13.0, 15.0, 12.0, 15.0, 26.0, 23.0, 39.0, 32.0, 65.0, 81.0, 76.0, 81.0, 72.0, 68.0, 55.0, 54.0, 47.0, 42.0, 30.0, 25.0, 15.0, 11.0, 12.0, 8.0, 11.0, 9.0, 4.0, 4.0, 6.0, 5.0, 2.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1651611328125, -0.16042709350585938, -0.15569305419921875, -0.15095901489257812, -0.1462249755859375, -0.14149093627929688, -0.13675689697265625, -0.13202285766601562, -0.127288818359375, -0.12255477905273438, -0.11782073974609375, -0.11308670043945312, -0.1083526611328125, -0.10361862182617188, -0.09888458251953125, -0.09415054321289062, -0.08941650390625, -0.08468246459960938, -0.07994842529296875, -0.07521438598632812, -0.0704803466796875, -0.06574630737304688, -0.06101226806640625, -0.056278228759765625, -0.051544189453125, -0.046810150146484375, -0.04207611083984375, -0.037342071533203125, -0.0326080322265625, -0.027873992919921875, -0.02313995361328125, -0.018405914306640625, -0.013671875, -0.008937835693359375, -0.00420379638671875, 0.000530242919921875, 0.0052642822265625, 0.009998321533203125, 0.01473236083984375, 0.019466400146484375, 0.024200439453125, 0.028934478759765625, 0.03366851806640625, 0.038402557373046875, 0.0431365966796875, 0.047870635986328125, 0.05260467529296875, 0.057338714599609375, 0.06207275390625, 0.06680679321289062, 0.07154083251953125, 0.07627487182617188, 0.0810089111328125, 0.08574295043945312, 0.09047698974609375, 0.09521102905273438, 0.099945068359375, 0.10467910766601562, 0.10941314697265625, 0.11414718627929688, 0.1188812255859375, 0.12361526489257812, 0.12834930419921875, 0.13308334350585938, 0.1378173828125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 6.0, 18.0, 50.0, 187.0, 503.0, 171.0, 49.0, 16.0, 5.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.74199104309082, -16.41053009033203, -16.079071044921875, -15.747610092163086, -15.416150093078613, -15.08469009399414, -14.753229141235352, -14.421769142150879, -14.090309143066406, -13.758849143981934, -13.427389144897461, -13.095928192138672, -12.7644681930542, -12.433008193969727, -12.101547241210938, -11.770087242126465, -11.438627243041992, -11.10716724395752, -10.775707244873047, -10.444246292114258, -10.112786293029785, -9.781326293945312, -9.449865341186523, -9.11840534210205, -8.786945343017578, -8.455485343933105, -8.124025344848633, -7.792564392089844, -7.461104393005371, -7.129644393920898, -6.798183917999268, -6.466723442077637, -6.135263442993164, -5.803803443908691, -5.4723429679870605, -5.14088249206543, -4.809422492980957, -4.477962493896484, -4.1465020179748535, -3.8150417804718018, -3.48358154296875, -3.1521213054656982, -2.8206610679626465, -2.4892008304595947, -2.157740592956543, -1.8262803554534912, -1.4948201179504395, -1.1633598804473877, -0.8318996429443359, -0.5004394054412842, -0.16897916793823242, 0.16248106956481934, 0.4939413070678711, 0.8254015445709229, 1.1568617820739746, 1.4883220195770264, 1.8197822570800781, 2.15124249458313, 2.4827027320861816, 2.8141629695892334, 3.145623207092285, 3.477083444595337, 3.8085436820983887, 4.1400041580200195, 4.471464157104492]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 6.0, 10.0, 4.0, 5.0, 8.0, 8.0, 12.0, 15.0, 15.0, 22.0, 24.0, 32.0, 39.0, 37.0, 34.0, 28.0, 46.0, 45.0, 35.0, 44.0, 51.0, 52.0, 42.0, 44.0, 46.0, 35.0, 31.0, 36.0, 35.0, 34.0, 23.0, 23.0, 19.0, 15.0, 10.0, 9.0, 4.0, 5.0, 7.0, 2.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.852600574493408, -3.736675262451172, -3.6207501888275146, -3.5048248767852783, -3.388899803161621, -3.2729744911193848, -3.1570494174957275, -3.041124105453491, -2.925199031829834, -2.8092737197875977, -2.6933486461639404, -2.577423334121704, -2.461498260498047, -2.3455729484558105, -2.2296478748321533, -2.113722562789917, -1.9977973699569702, -1.8818721771240234, -1.7659469842910767, -1.6500217914581299, -1.534096598625183, -1.4181714057922363, -1.30224609375, -1.1863210201263428, -1.0703957080841064, -0.9544705152511597, -0.8385453224182129, -0.7226201295852661, -0.6066949367523193, -0.4907696843147278, -0.374844491481781, -0.25891929864883423, -0.14299416542053223, -0.027068965137004852, 0.08885623514652252, 0.2047814428806305, 0.32070663571357727, 0.43663185834884644, 0.5525570511817932, 0.66848224401474, 0.7844074368476868, 0.9003326296806335, 1.016257882118225, 1.1321830749511719, 1.2481082677841187, 1.3640334606170654, 1.4799586534500122, 1.595883846282959, 1.7118090391159058, 1.8277342319488525, 1.9436594247817993, 2.059584617614746, 2.1755099296569824, 2.2914350032806396, 2.407360315322876, 2.523285388946533, 2.6392107009887695, 2.755136013031006, 2.871061086654663, 2.9869863986968994, 3.1029114723205566, 3.218836784362793, 3.33476185798645, 3.4506871700286865, 3.5666122436523438]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 2.0, 4.0, 15.0, 12.0, 13.0, 25.0, 43.0, 79.0, 242.0, 928.0, 7104.0, 4179547.0, 5250.0, 702.0, 165.0, 54.0, 35.0, 23.0, 15.0, 7.0, 4.0, 7.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.71484375, -5.5863037109375, -5.457763671875, -5.3292236328125, -5.20068359375, -5.0721435546875, -4.943603515625, -4.8150634765625, -4.6865234375, -4.5579833984375, -4.429443359375, -4.3009033203125, -4.17236328125, -4.0438232421875, -3.915283203125, -3.7867431640625, -3.658203125, -3.5296630859375, -3.401123046875, -3.2725830078125, -3.14404296875, -3.0155029296875, -2.886962890625, -2.7584228515625, -2.6298828125, -2.5013427734375, -2.372802734375, -2.2442626953125, -2.11572265625, -1.9871826171875, -1.858642578125, -1.7301025390625, -1.6015625, -1.4730224609375, -1.344482421875, -1.2159423828125, -1.08740234375, -0.9588623046875, -0.830322265625, -0.7017822265625, -0.5732421875, -0.4447021484375, -0.316162109375, -0.1876220703125, -0.05908203125, 0.0694580078125, 0.197998046875, 0.3265380859375, 0.455078125, 0.5836181640625, 0.712158203125, 0.8406982421875, 0.96923828125, 1.0977783203125, 1.226318359375, 1.3548583984375, 1.4833984375, 1.6119384765625, 1.740478515625, 1.8690185546875, 1.99755859375, 2.1260986328125, 2.254638671875, 2.3831787109375, 2.51171875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 21.0, 72.0, 107.0, 191.0, 241.0, 168.0, 114.0, 39.0, 20.0, 9.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.74072265625, -0.7240219116210938, -0.7073211669921875, -0.6906204223632812, -0.673919677734375, -0.6572189331054688, -0.6405181884765625, -0.6238174438476562, -0.60711669921875, -0.5904159545898438, -0.5737152099609375, -0.5570144653320312, -0.540313720703125, -0.5236129760742188, -0.5069122314453125, -0.49021148681640625, -0.4735107421875, -0.45680999755859375, -0.4401092529296875, -0.42340850830078125, -0.406707763671875, -0.39000701904296875, -0.3733062744140625, -0.35660552978515625, -0.33990478515625, -0.32320404052734375, -0.3065032958984375, -0.28980255126953125, -0.273101806640625, -0.25640106201171875, -0.2397003173828125, -0.22299957275390625, -0.206298828125, -0.18959808349609375, -0.1728973388671875, -0.15619659423828125, -0.139495849609375, -0.12279510498046875, -0.1060943603515625, -0.08939361572265625, -0.07269287109375, -0.05599212646484375, -0.0392913818359375, -0.02259063720703125, -0.005889892578125, 0.01081085205078125, 0.0275115966796875, 0.04421234130859375, 0.0609130859375, 0.07761383056640625, 0.0943145751953125, 0.11101531982421875, 0.127716064453125, 0.14441680908203125, 0.1611175537109375, 0.17781829833984375, 0.19451904296875, 0.21121978759765625, 0.2279205322265625, 0.24462127685546875, 0.261322021484375, 0.27802276611328125, 0.2947235107421875, 0.31142425537109375, 0.328125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 8.0, 14.0, 14.0, 25.0, 56.0, 113.0, 243.0, 527.0, 1504.0, 5411.0, 39492.0, 4048861.0, 86290.0, 8116.0, 2161.0, 785.0, 316.0, 160.0, 77.0, 36.0, 36.0, 16.0, 7.0, 7.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.548828125, -1.5107040405273438, -1.4725799560546875, -1.4344558715820312, -1.396331787109375, -1.3582077026367188, -1.3200836181640625, -1.2819595336914062, -1.24383544921875, -1.2057113647460938, -1.1675872802734375, -1.1294631958007812, -1.091339111328125, -1.0532150268554688, -1.0150909423828125, -0.9769668579101562, -0.9388427734375, -0.9007186889648438, -0.8625946044921875, -0.8244705200195312, -0.786346435546875, -0.7482223510742188, -0.7100982666015625, -0.6719741821289062, -0.63385009765625, -0.5957260131835938, -0.5576019287109375, -0.5194778442382812, -0.481353759765625, -0.44322967529296875, -0.4051055908203125, -0.36698150634765625, -0.328857421875, -0.29073333740234375, -0.2526092529296875, -0.21448516845703125, -0.176361083984375, -0.13823699951171875, -0.1001129150390625, -0.06198883056640625, -0.02386474609375, 0.01425933837890625, 0.0523834228515625, 0.09050750732421875, 0.128631591796875, 0.16675567626953125, 0.2048797607421875, 0.24300384521484375, 0.2811279296875, 0.31925201416015625, 0.3573760986328125, 0.39550018310546875, 0.433624267578125, 0.47174835205078125, 0.5098724365234375, 0.5479965209960938, 0.58612060546875, 0.6242446899414062, 0.6623687744140625, 0.7004928588867188, 0.738616943359375, 0.7767410278320312, 0.8148651123046875, 0.8529891967773438, 0.89111328125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 5.0, 6.0, 4.0, 15.0, 27.0, 39.0, 72.0, 169.0, 767.0, 2625.0, 158.0, 58.0, 44.0, 28.0, 12.0, 10.0, 7.0, 7.0, 2.0, 3.0, 4.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.305419921875, -0.2922325134277344, -0.27904510498046875, -0.2658576965332031, -0.2526702880859375, -0.23948287963867188, -0.22629547119140625, -0.21310806274414062, -0.199920654296875, -0.18673324584960938, -0.17354583740234375, -0.16035842895507812, -0.1471710205078125, -0.13398361206054688, -0.12079620361328125, -0.10760879516601562, -0.09442138671875, -0.08123397827148438, -0.06804656982421875, -0.054859161376953125, -0.0416717529296875, -0.028484344482421875, -0.01529693603515625, -0.002109527587890625, 0.011077880859375, 0.024265289306640625, 0.03745269775390625, 0.050640106201171875, 0.0638275146484375, 0.07701492309570312, 0.09020233154296875, 0.10338973999023438, 0.1165771484375, 0.12976455688476562, 0.14295196533203125, 0.15613937377929688, 0.1693267822265625, 0.18251419067382812, 0.19570159912109375, 0.20888900756835938, 0.222076416015625, 0.23526382446289062, 0.24845123291015625, 0.2616386413574219, 0.2748260498046875, 0.2880134582519531, 0.30120086669921875, 0.3143882751464844, 0.32757568359375, 0.3407630920410156, 0.35395050048828125, 0.3671379089355469, 0.3803253173828125, 0.3935127258300781, 0.40670013427734375, 0.4198875427246094, 0.433074951171875, 0.4462623596191406, 0.45944976806640625, 0.4726371765136719, 0.4858245849609375, 0.4990119934082031, 0.5121994018554688, 0.5253868103027344, 0.53857421875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 5.0, 7.0, 6.0, 26.0, 78.0, 232.0, 384.0, 176.0, 57.0, 23.0, 12.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.161806344985962, -3.0679574012756348, -2.9741084575653076, -2.8802595138549805, -2.786410331726074, -2.692561388015747, -2.59871244430542, -2.5048635005950928, -2.4110145568847656, -2.3171656131744385, -2.2233166694641113, -2.129467725753784, -2.035618782043457, -1.9417697191238403, -1.8479206562042236, -1.7540717124938965, -1.6602227687835693, -1.5663738250732422, -1.472524881362915, -1.3786758184432983, -1.2848268747329712, -1.190977931022644, -1.0971288681030273, -1.0032799243927002, -0.909430980682373, -0.8155820369720459, -0.721733033657074, -0.627884030342102, -0.5340350866317749, -0.44018611311912537, -0.34633713960647583, -0.2524881362915039, -0.15863895416259766, -0.06478998064994812, 0.029058992862701416, 0.12290796637535095, 0.2167569398880005, 0.31060591340065, 0.40445488691329956, 0.4983038902282715, 0.5921528339385986, 0.6860017776489258, 0.7798507809638977, 0.8736997842788696, 0.9675487279891968, 1.061397671699524, 1.1552467346191406, 1.2490956783294678, 1.342944622039795, 1.436793565750122, 1.5306425094604492, 1.624491572380066, 1.718340516090393, 1.8121894598007202, 1.906038522720337, 1.999887466430664, 2.093736410140991, 2.1875853538513184, 2.2814342975616455, 2.3752832412719727, 2.469132423400879, 2.562981367111206, 2.656830310821533, 2.7506792545318604, 2.8445281982421875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 0.0, 1.0, 6.0, 4.0, 10.0, 12.0, 16.0, 20.0, 37.0, 44.0, 61.0, 74.0, 59.0, 74.0, 70.0, 77.0, 96.0, 74.0, 62.0, 51.0, 28.0, 34.0, 38.0, 20.0, 11.0, 11.0, 10.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4109008312225342, -1.3583920001983643, -1.3058831691741943, -1.2533743381500244, -1.2008655071258545, -1.1483566761016846, -1.0958478450775146, -1.0433388948440552, -0.9908300638198853, -0.9383212327957153, -0.8858124017715454, -0.8333035707473755, -0.7807946801185608, -0.7282858490943909, -0.675777018070221, -0.6232681274414062, -0.5707593560218811, -0.5182505249977112, -0.46574166417121887, -0.41323283314704895, -0.36072397232055664, -0.3082151412963867, -0.2557063102722168, -0.2031974494457245, -0.15068861842155457, -0.09817977249622345, -0.04567093402147293, 0.006837904453277588, 0.059346750378608704, 0.11185559630393982, 0.16436442732810974, 0.21687328815460205, 0.269382119178772, 0.3218909502029419, 0.3743998110294342, 0.4269086420536041, 0.47941750288009644, 0.5319263339042664, 0.5844351649284363, 0.636944055557251, 0.6894528865814209, 0.7419617176055908, 0.7944705486297607, 0.8469793796539307, 0.8994882702827454, 0.9519971013069153, 1.0045058727264404, 1.0570148229599, 1.1095235347747803, 1.1620323657989502, 1.2145411968231201, 1.26705002784729, 1.31955885887146, 1.3720676898956299, 1.4245765209197998, 1.4770854711532593, 1.5295943021774292, 1.5821031332015991, 1.634611964225769, 1.687120795249939, 1.7396296262741089, 1.7921385765075684, 1.8446474075317383, 1.8971562385559082, 1.9496650695800781]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 7.0, 8.0, 13.0, 13.0, 17.0, 24.0, 33.0, 61.0, 87.0, 174.0, 393.0, 874.0, 2919.0, 21923.0, 929899.0, 84672.0, 4977.0, 1420.0, 466.0, 227.0, 129.0, 72.0, 44.0, 36.0, 25.0, 14.0, 6.0, 5.0, 8.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.412109375, -2.342559814453125, -2.27301025390625, -2.203460693359375, -2.1339111328125, -2.064361572265625, -1.99481201171875, -1.925262451171875, -1.855712890625, -1.786163330078125, -1.71661376953125, -1.647064208984375, -1.5775146484375, -1.507965087890625, -1.43841552734375, -1.368865966796875, -1.29931640625, -1.229766845703125, -1.16021728515625, -1.090667724609375, -1.0211181640625, -0.951568603515625, -0.88201904296875, -0.812469482421875, -0.742919921875, -0.673370361328125, -0.60382080078125, -0.534271240234375, -0.4647216796875, -0.395172119140625, -0.32562255859375, -0.256072998046875, -0.1865234375, -0.116973876953125, -0.04742431640625, 0.022125244140625, 0.0916748046875, 0.161224365234375, 0.23077392578125, 0.300323486328125, 0.369873046875, 0.439422607421875, 0.50897216796875, 0.578521728515625, 0.6480712890625, 0.717620849609375, 0.78717041015625, 0.856719970703125, 0.92626953125, 0.995819091796875, 1.06536865234375, 1.134918212890625, 1.2044677734375, 1.274017333984375, 1.34356689453125, 1.413116455078125, 1.482666015625, 1.552215576171875, 1.62176513671875, 1.691314697265625, 1.7608642578125, 1.830413818359375, 1.89996337890625, 1.969512939453125, 2.0390625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 15.0, 43.0, 98.0, 139.0, 213.0, 218.0, 147.0, 65.0, 33.0, 13.0, 6.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7099609375, -0.6937675476074219, -0.6775741577148438, -0.6613807678222656, -0.6451873779296875, -0.6289939880371094, -0.6128005981445312, -0.5966072082519531, -0.580413818359375, -0.5642204284667969, -0.5480270385742188, -0.5318336486816406, -0.5156402587890625, -0.4994468688964844, -0.48325347900390625, -0.4670600891113281, -0.45086669921875, -0.4346733093261719, -0.41847991943359375, -0.4022865295410156, -0.3860931396484375, -0.3698997497558594, -0.35370635986328125, -0.3375129699707031, -0.321319580078125, -0.3051261901855469, -0.28893280029296875, -0.2727394104003906, -0.2565460205078125, -0.24035263061523438, -0.22415924072265625, -0.20796585083007812, -0.1917724609375, -0.17557907104492188, -0.15938568115234375, -0.14319229125976562, -0.1269989013671875, -0.11080551147460938, -0.09461212158203125, -0.07841873168945312, -0.062225341796875, -0.046031951904296875, -0.02983856201171875, -0.013645172119140625, 0.0025482177734375, 0.018741607666015625, 0.03493499755859375, 0.051128387451171875, 0.06732177734375, 0.08351516723632812, 0.09970855712890625, 0.11590194702148438, 0.1320953369140625, 0.14828872680664062, 0.16448211669921875, 0.18067550659179688, 0.196868896484375, 0.21306228637695312, 0.22925567626953125, 0.24544906616210938, 0.2616424560546875, 0.2778358459472656, 0.29402923583984375, 0.3102226257324219, 0.326416015625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 3.0, 1.0, 0.0, 6.0, 5.0, 13.0, 7.0, 20.0, 24.0, 36.0, 53.0, 88.0, 130.0, 276.0, 756.0, 2182.0, 8570.0, 55370.0, 736635.0, 216026.0, 21710.0, 4267.0, 1322.0, 505.0, 217.0, 120.0, 62.0, 34.0, 26.0, 36.0, 18.0, 11.0, 10.0, 10.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4228515625, -1.3841552734375, -1.345458984375, -1.3067626953125, -1.26806640625, -1.2293701171875, -1.190673828125, -1.1519775390625, -1.11328125, -1.0745849609375, -1.035888671875, -0.9971923828125, -0.95849609375, -0.9197998046875, -0.881103515625, -0.8424072265625, -0.8037109375, -0.7650146484375, -0.726318359375, -0.6876220703125, -0.64892578125, -0.6102294921875, -0.571533203125, -0.5328369140625, -0.494140625, -0.4554443359375, -0.416748046875, -0.3780517578125, -0.33935546875, -0.3006591796875, -0.261962890625, -0.2232666015625, -0.1845703125, -0.1458740234375, -0.107177734375, -0.0684814453125, -0.02978515625, 0.0089111328125, 0.047607421875, 0.0863037109375, 0.125, 0.1636962890625, 0.202392578125, 0.2410888671875, 0.27978515625, 0.3184814453125, 0.357177734375, 0.3958740234375, 0.4345703125, 0.4732666015625, 0.511962890625, 0.5506591796875, 0.58935546875, 0.6280517578125, 0.666748046875, 0.7054443359375, 0.744140625, 0.7828369140625, 0.821533203125, 0.8602294921875, 0.89892578125, 0.9376220703125, 0.976318359375, 1.0150146484375, 1.0537109375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 9.0, 10.0, 8.0, 13.0, 23.0, 16.0, 23.0, 23.0, 21.0, 46.0, 49.0, 46.0, 51.0, 59.0, 84.0, 86.0, 54.0, 63.0, 65.0, 42.0, 37.0, 34.0, 27.0, 29.0, 21.0, 19.0, 13.0, 9.0, 8.0, 7.0, 4.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77490234375, -0.7454910278320312, -0.7160797119140625, -0.6866683959960938, -0.657257080078125, -0.6278457641601562, -0.5984344482421875, -0.5690231323242188, -0.53961181640625, -0.5102005004882812, -0.4807891845703125, -0.45137786865234375, -0.421966552734375, -0.39255523681640625, -0.3631439208984375, -0.33373260498046875, -0.3043212890625, -0.27490997314453125, -0.2454986572265625, -0.21608734130859375, -0.186676025390625, -0.15726470947265625, -0.1278533935546875, -0.09844207763671875, -0.06903076171875, -0.03961944580078125, -0.0102081298828125, 0.01920318603515625, 0.048614501953125, 0.07802581787109375, 0.1074371337890625, 0.13684844970703125, 0.166259765625, 0.19567108154296875, 0.2250823974609375, 0.25449371337890625, 0.283905029296875, 0.31331634521484375, 0.3427276611328125, 0.37213897705078125, 0.40155029296875, 0.43096160888671875, 0.4603729248046875, 0.48978424072265625, 0.519195556640625, 0.5486068725585938, 0.5780181884765625, 0.6074295043945312, 0.6368408203125, 0.6662521362304688, 0.6956634521484375, 0.7250747680664062, 0.754486083984375, 0.7838973999023438, 0.8133087158203125, 0.8427200317382812, 0.87213134765625, 0.9015426635742188, 0.9309539794921875, 0.9603652954101562, 0.989776611328125, 1.0191879272460938, 1.0485992431640625, 1.0780105590820312, 1.107421875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 0.0, 3.0, 10.0, 3.0, 6.0, 16.0, 19.0, 35.0, 67.0, 136.0, 278.0, 759.0, 2383.0, 11664.0, 123056.0, 851382.0, 49440.0, 6720.0, 1596.0, 521.0, 193.0, 86.0, 58.0, 29.0, 30.0, 14.0, 9.0, 6.0, 12.0, 7.0, 3.0, 3.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3359375, -0.3255500793457031, -0.31516265869140625, -0.3047752380371094, -0.2943878173828125, -0.2840003967285156, -0.27361297607421875, -0.2632255554199219, -0.252838134765625, -0.24245071411132812, -0.23206329345703125, -0.22167587280273438, -0.2112884521484375, -0.20090103149414062, -0.19051361083984375, -0.18012619018554688, -0.16973876953125, -0.15935134887695312, -0.14896392822265625, -0.13857650756835938, -0.1281890869140625, -0.11780166625976562, -0.10741424560546875, -0.09702682495117188, -0.086639404296875, -0.07625198364257812, -0.06586456298828125, -0.055477142333984375, -0.0450897216796875, -0.034702301025390625, -0.02431488037109375, -0.013927459716796875, -0.0035400390625, 0.006847381591796875, 0.01723480224609375, 0.027622222900390625, 0.0380096435546875, 0.048397064208984375, 0.05878448486328125, 0.06917190551757812, 0.079559326171875, 0.08994674682617188, 0.10033416748046875, 0.11072158813476562, 0.1211090087890625, 0.13149642944335938, 0.14188385009765625, 0.15227127075195312, 0.16265869140625, 0.17304611206054688, 0.18343353271484375, 0.19382095336914062, 0.2042083740234375, 0.21459579467773438, 0.22498321533203125, 0.23537063598632812, 0.245758056640625, 0.2561454772949219, 0.26653289794921875, 0.2769203186035156, 0.2873077392578125, 0.2976951599121094, 0.30808258056640625, 0.3184700012207031, 0.328857421875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 0.0, 2.0, 2.0, 9.0, 9.0, 8.0, 13.0, 20.0, 17.0, 28.0, 40.0, 47.0, 72.0, 112.0, 107.0, 144.0, 104.0, 87.0, 47.0, 32.0, 22.0, 26.0, 8.0, 7.0, 8.0, 9.0, 5.0, 3.0, 1.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6927719116210938e-05, -1.6219913959503174e-05, -1.551210880279541e-05, -1.4804303646087646e-05, -1.4096498489379883e-05, -1.3388693332672119e-05, -1.2680888175964355e-05, -1.1973083019256592e-05, -1.1265277862548828e-05, -1.0557472705841064e-05, -9.8496675491333e-06, -9.141862392425537e-06, -8.434057235717773e-06, -7.72625207901001e-06, -7.018446922302246e-06, -6.310641765594482e-06, -5.602836608886719e-06, -4.895031452178955e-06, -4.187226295471191e-06, -3.4794211387634277e-06, -2.771615982055664e-06, -2.0638108253479004e-06, -1.3560056686401367e-06, -6.48200511932373e-07, 5.960464477539063e-08, 7.674098014831543e-07, 1.475214958190918e-06, 2.1830201148986816e-06, 2.8908252716064453e-06, 3.598630428314209e-06, 4.306435585021973e-06, 5.014240741729736e-06, 5.7220458984375e-06, 6.429851055145264e-06, 7.137656211853027e-06, 7.845461368560791e-06, 8.553266525268555e-06, 9.261071681976318e-06, 9.968876838684082e-06, 1.0676681995391846e-05, 1.138448715209961e-05, 1.2092292308807373e-05, 1.2800097465515137e-05, 1.35079026222229e-05, 1.4215707778930664e-05, 1.4923512935638428e-05, 1.563131809234619e-05, 1.6339123249053955e-05, 1.704692840576172e-05, 1.7754733562469482e-05, 1.8462538719177246e-05, 1.917034387588501e-05, 1.9878149032592773e-05, 2.0585954189300537e-05, 2.12937593460083e-05, 2.2001564502716064e-05, 2.2709369659423828e-05, 2.3417174816131592e-05, 2.4124979972839355e-05, 2.483278512954712e-05, 2.5540590286254883e-05, 2.6248395442962646e-05, 2.695620059967041e-05, 2.7664005756378174e-05, 2.8371810913085938e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 9.0, 7.0, 7.0, 12.0, 16.0, 26.0, 34.0, 86.0, 161.0, 396.0, 1402.0, 7958.0, 145647.0, 870567.0, 18483.0, 2622.0, 627.0, 240.0, 110.0, 53.0, 22.0, 14.0, 20.0, 10.0, 10.0, 7.0, 4.0, 3.0, 4.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3740234375, -0.3597412109375, -0.345458984375, -0.3311767578125, -0.31689453125, -0.3026123046875, -0.288330078125, -0.2740478515625, -0.259765625, -0.2454833984375, -0.231201171875, -0.2169189453125, -0.20263671875, -0.1883544921875, -0.174072265625, -0.1597900390625, -0.1455078125, -0.1312255859375, -0.116943359375, -0.1026611328125, -0.08837890625, -0.0740966796875, -0.059814453125, -0.0455322265625, -0.03125, -0.0169677734375, -0.002685546875, 0.0115966796875, 0.02587890625, 0.0401611328125, 0.054443359375, 0.0687255859375, 0.0830078125, 0.0972900390625, 0.111572265625, 0.1258544921875, 0.14013671875, 0.1544189453125, 0.168701171875, 0.1829833984375, 0.197265625, 0.2115478515625, 0.225830078125, 0.2401123046875, 0.25439453125, 0.2686767578125, 0.282958984375, 0.2972412109375, 0.3115234375, 0.3258056640625, 0.340087890625, 0.3543701171875, 0.36865234375, 0.3829345703125, 0.397216796875, 0.4114990234375, 0.42578125, 0.4400634765625, 0.454345703125, 0.4686279296875, 0.48291015625, 0.4971923828125, 0.511474609375, 0.5257568359375, 0.5400390625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 0.0, 4.0, 3.0, 3.0, 6.0, 6.0, 8.0, 8.0, 7.0, 15.0, 16.0, 35.0, 45.0, 66.0, 110.0, 138.0, 149.0, 123.0, 66.0, 60.0, 34.0, 23.0, 15.0, 13.0, 10.0, 9.0, 5.0, 4.0, 3.0, 5.0, 4.0, 1.0, 3.0, 4.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16357421875, -0.15757369995117188, -0.15157318115234375, -0.14557266235351562, -0.1395721435546875, -0.13357162475585938, -0.12757110595703125, -0.12157058715820312, -0.115570068359375, -0.10956954956054688, -0.10356903076171875, -0.09756851196289062, -0.0915679931640625, -0.08556747436523438, -0.07956695556640625, -0.07356643676757812, -0.06756591796875, -0.061565399169921875, -0.05556488037109375, -0.049564361572265625, -0.0435638427734375, -0.037563323974609375, -0.03156280517578125, -0.025562286376953125, -0.019561767578125, -0.013561248779296875, -0.00756072998046875, -0.001560211181640625, 0.0044403076171875, 0.010440826416015625, 0.01644134521484375, 0.022441864013671875, 0.0284423828125, 0.034442901611328125, 0.04044342041015625, 0.046443939208984375, 0.0524444580078125, 0.058444976806640625, 0.06444549560546875, 0.07044601440429688, 0.076446533203125, 0.08244705200195312, 0.08844757080078125, 0.09444808959960938, 0.1004486083984375, 0.10644912719726562, 0.11244964599609375, 0.11845016479492188, 0.12445068359375, 0.13045120239257812, 0.13645172119140625, 0.14245223999023438, 0.1484527587890625, 0.15445327758789062, 0.16045379638671875, 0.16645431518554688, 0.172454833984375, 0.17845535278320312, 0.18445587158203125, 0.19045639038085938, 0.1964569091796875, 0.20245742797851562, 0.20845794677734375, 0.21445846557617188, 0.220458984375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 13.0, 65.0, 278.0, 451.0, 142.0, 39.0, 14.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.783329010009766, -21.350446701049805, -20.917564392089844, -20.484683990478516, -20.051801681518555, -19.618919372558594, -19.186037063598633, -18.753154754638672, -18.320274353027344, -17.887392044067383, -17.454509735107422, -17.021629333496094, -16.588747024536133, -16.155864715576172, -15.722982406616211, -15.290101051330566, -14.857217788696289, -14.424335479736328, -13.991454124450684, -13.558571815490723, -13.125690460205078, -12.692808151245117, -12.259925842285156, -11.827044486999512, -11.394163131713867, -10.961280822753906, -10.528399467468262, -10.0955171585083, -9.662635803222656, -9.229753494262695, -8.796871185302734, -8.36398983001709, -7.931107997894287, -7.498226165771484, -7.065344333648682, -6.632462501525879, -6.199580192565918, -5.766698360443115, -5.3338165283203125, -4.900934219360352, -4.468052864074707, -4.035171031951904, -3.6022889614105225, -3.1694071292877197, -2.736525058746338, -2.303643226623535, -1.8707613945007324, -1.4378793239593506, -1.0049972534179688, -0.5721153020858765, -0.13923341035842896, 0.29364848136901855, 0.7265304327011108, 1.1594123840332031, 1.5922942161560059, 2.0251762866973877, 2.4580581188201904, 2.890939950942993, 3.323822021484375, 3.7567038536071777, 4.1895856857299805, 4.622467994689941, 5.055349349975586, 5.488231658935547, 5.92111349105835]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 7.0, 5.0, 3.0, 3.0, 7.0, 9.0, 18.0, 9.0, 14.0, 24.0, 23.0, 34.0, 34.0, 30.0, 34.0, 31.0, 40.0, 36.0, 45.0, 34.0, 52.0, 42.0, 47.0, 34.0, 54.0, 32.0, 37.0, 43.0, 34.0, 34.0, 25.0, 28.0, 22.0, 13.0, 16.0, 13.0, 9.0, 17.0, 3.0, 1.0, 5.0, 5.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.39192008972168, -4.265620231628418, -4.139319896697998, -4.013020038604736, -3.8867197036743164, -3.7604198455810547, -3.634119749069214, -3.507819652557373, -3.3815195560455322, -3.2552194595336914, -3.1289193630218506, -3.0026192665100098, -2.876319408416748, -2.750019073486328, -2.6237192153930664, -2.4974191188812256, -2.3711190223693848, -2.244818925857544, -2.118518829345703, -1.9922188520431519, -1.865918755531311, -1.7396186590194702, -1.613318681716919, -1.4870185852050781, -1.3607184886932373, -1.2344183921813965, -1.1081182956695557, -0.9818183183670044, -0.8555182218551636, -0.7292181253433228, -0.6029180884361267, -0.47661805152893066, -0.35031771659851074, -0.2240176498889923, -0.09771758317947388, 0.028582483530044556, 0.154882550239563, 0.2811826467514038, 0.40748268365859985, 0.5337827205657959, 0.6600828170776367, 0.7863829135894775, 0.9126829504966736, 1.0389829874038696, 1.1652830839157104, 1.2915831804275513, 1.4178831577301025, 1.5441832542419434, 1.6704833507537842, 1.796783447265625, 1.9230835437774658, 2.0493836402893066, 2.1756834983825684, 2.3019838333129883, 2.42828369140625, 2.554583787918091, 2.6808838844299316, 2.8071839809417725, 2.9334840774536133, 3.059784173965454, 3.186084270477295, 3.3123841285705566, 3.4386842250823975, 3.5649843215942383, 3.691284418106079]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 4.0, 9.0, 11.0, 15.0, 10.0, 26.0, 25.0, 31.0, 48.0, 67.0, 83.0, 141.0, 232.0, 415.0, 907.0, 2314.0, 8263.0, 67130.0, 4062687.0, 42200.0, 6460.0, 1863.0, 702.0, 288.0, 146.0, 80.0, 37.0, 32.0, 17.0, 9.0, 10.0, 7.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.4609375, -1.42803955078125, -1.3951416015625, -1.36224365234375, -1.329345703125, -1.29644775390625, -1.2635498046875, -1.23065185546875, -1.19775390625, -1.16485595703125, -1.1319580078125, -1.09906005859375, -1.066162109375, -1.03326416015625, -1.0003662109375, -0.96746826171875, -0.9345703125, -0.90167236328125, -0.8687744140625, -0.83587646484375, -0.802978515625, -0.77008056640625, -0.7371826171875, -0.70428466796875, -0.67138671875, -0.63848876953125, -0.6055908203125, -0.57269287109375, -0.539794921875, -0.50689697265625, -0.4739990234375, -0.44110107421875, -0.408203125, -0.37530517578125, -0.3424072265625, -0.30950927734375, -0.276611328125, -0.24371337890625, -0.2108154296875, -0.17791748046875, -0.14501953125, -0.11212158203125, -0.0792236328125, -0.04632568359375, -0.013427734375, 0.01947021484375, 0.0523681640625, 0.08526611328125, 0.1181640625, 0.15106201171875, 0.1839599609375, 0.21685791015625, 0.249755859375, 0.28265380859375, 0.3155517578125, 0.34844970703125, 0.38134765625, 0.41424560546875, 0.4471435546875, 0.48004150390625, 0.512939453125, 0.54583740234375, 0.5787353515625, 0.61163330078125, 0.64453125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 6.0, 18.0, 41.0, 75.0, 127.0, 169.0, 184.0, 146.0, 116.0, 67.0, 24.0, 15.0, 7.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.75537109375, -0.7386932373046875, -0.722015380859375, -0.7053375244140625, -0.68865966796875, -0.6719818115234375, -0.655303955078125, -0.6386260986328125, -0.6219482421875, -0.6052703857421875, -0.588592529296875, -0.5719146728515625, -0.55523681640625, -0.5385589599609375, -0.521881103515625, -0.5052032470703125, -0.488525390625, -0.4718475341796875, -0.455169677734375, -0.4384918212890625, -0.42181396484375, -0.4051361083984375, -0.388458251953125, -0.3717803955078125, -0.3551025390625, -0.3384246826171875, -0.321746826171875, -0.3050689697265625, -0.28839111328125, -0.2717132568359375, -0.255035400390625, -0.2383575439453125, -0.2216796875, -0.2050018310546875, -0.188323974609375, -0.1716461181640625, -0.15496826171875, -0.1382904052734375, -0.121612548828125, -0.1049346923828125, -0.0882568359375, -0.0715789794921875, -0.054901123046875, -0.0382232666015625, -0.02154541015625, -0.0048675537109375, 0.011810302734375, 0.0284881591796875, 0.045166015625, 0.0618438720703125, 0.078521728515625, 0.0951995849609375, 0.11187744140625, 0.1285552978515625, 0.145233154296875, 0.1619110107421875, 0.1785888671875, 0.1952667236328125, 0.211944580078125, 0.2286224365234375, 0.24530029296875, 0.2619781494140625, 0.278656005859375, 0.2953338623046875, 0.31201171875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 1.0, 4.0, 7.0, 14.0, 23.0, 54.0, 120.0, 260.0, 666.0, 1587.0, 3657.0, 11130.0, 57778.0, 3978020.0, 115552.0, 16466.0, 5120.0, 2133.0, 926.0, 421.0, 176.0, 73.0, 29.0, 20.0, 7.0, 8.0, 3.0, 3.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.96533203125, -0.9374618530273438, -0.9095916748046875, -0.8817214965820312, -0.853851318359375, -0.8259811401367188, -0.7981109619140625, -0.7702407836914062, -0.74237060546875, -0.7145004272460938, -0.6866302490234375, -0.6587600708007812, -0.630889892578125, -0.6030197143554688, -0.5751495361328125, -0.5472793579101562, -0.5194091796875, -0.49153900146484375, -0.4636688232421875, -0.43579864501953125, -0.407928466796875, -0.38005828857421875, -0.3521881103515625, -0.32431793212890625, -0.29644775390625, -0.26857757568359375, -0.2407073974609375, -0.21283721923828125, -0.184967041015625, -0.15709686279296875, -0.1292266845703125, -0.10135650634765625, -0.073486328125, -0.04561614990234375, -0.0177459716796875, 0.01012420654296875, 0.037994384765625, 0.06586456298828125, 0.0937347412109375, 0.12160491943359375, 0.14947509765625, 0.17734527587890625, 0.2052154541015625, 0.23308563232421875, 0.260955810546875, 0.28882598876953125, 0.3166961669921875, 0.34456634521484375, 0.3724365234375, 0.40030670166015625, 0.4281768798828125, 0.45604705810546875, 0.483917236328125, 0.5117874145507812, 0.5396575927734375, 0.5675277709960938, 0.59539794921875, 0.6232681274414062, 0.6511383056640625, 0.6790084838867188, 0.706878662109375, 0.7347488403320312, 0.7626190185546875, 0.7904891967773438, 0.818359375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 3.0, 5.0, 9.0, 14.0, 28.0, 16.0, 27.0, 64.0, 108.0, 302.0, 2960.0, 264.0, 93.0, 37.0, 29.0, 21.0, 15.0, 17.0, 11.0, 8.0, 2.0, 7.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.256591796875, -0.24819183349609375, -0.2397918701171875, -0.23139190673828125, -0.222991943359375, -0.21459197998046875, -0.2061920166015625, -0.19779205322265625, -0.18939208984375, -0.18099212646484375, -0.1725921630859375, -0.16419219970703125, -0.155792236328125, -0.14739227294921875, -0.1389923095703125, -0.13059234619140625, -0.1221923828125, -0.11379241943359375, -0.1053924560546875, -0.09699249267578125, -0.088592529296875, -0.08019256591796875, -0.0717926025390625, -0.06339263916015625, -0.05499267578125, -0.04659271240234375, -0.0381927490234375, -0.02979278564453125, -0.021392822265625, -0.01299285888671875, -0.0045928955078125, 0.00380706787109375, 0.01220703125, 0.02060699462890625, 0.0290069580078125, 0.03740692138671875, 0.045806884765625, 0.05420684814453125, 0.0626068115234375, 0.07100677490234375, 0.07940673828125, 0.08780670166015625, 0.0962066650390625, 0.10460662841796875, 0.113006591796875, 0.12140655517578125, 0.1298065185546875, 0.13820648193359375, 0.1466064453125, 0.15500640869140625, 0.1634063720703125, 0.17180633544921875, 0.180206298828125, 0.18860626220703125, 0.1970062255859375, 0.20540618896484375, 0.21380615234375, 0.22220611572265625, 0.2306060791015625, 0.23900604248046875, 0.247406005859375, 0.25580596923828125, 0.2642059326171875, 0.27260589599609375, 0.281005859375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 10.0, 18.0, 25.0, 78.0, 225.0, 342.0, 199.0, 72.0, 18.0, 8.0, 6.0, 5.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5095571279525757, -1.4336057901382446, -1.3576544523239136, -1.2817031145095825, -1.205751657485962, -1.1298003196716309, -1.0538489818572998, -0.9778976440429688, -0.9019463062286377, -0.8259949684143066, -0.7500436305999756, -0.6740922331809998, -0.5981408953666687, -0.5221895575523376, -0.4462381899356842, -0.37028682231903076, -0.2943354845046997, -0.21838413178920746, -0.1424327790737152, -0.06648142635822296, 0.009469926357269287, 0.08542126417160034, 0.16137263178825378, 0.23732399940490723, 0.3132753372192383, 0.38922667503356934, 0.4651780426502228, 0.5411294102668762, 0.6170807480812073, 0.6930320858955383, 0.7689834833145142, 0.8449348211288452, 0.9208860397338867, 0.9968373775482178, 1.0727887153625488, 1.1487400531768799, 1.224691390991211, 1.300642728805542, 1.3765941858291626, 1.4525455236434937, 1.5284968614578247, 1.6044481992721558, 1.6803995370864868, 1.7563508749008179, 1.8323023319244385, 1.9082536697387695, 1.9842050075531006, 2.0601563453674316, 2.1361076831817627, 2.2120590209960938, 2.288010358810425, 2.363961696624756, 2.439913034439087, 2.515864372253418, 2.591815710067749, 2.66776704788208, 2.7437186241149902, 2.8196699619293213, 2.8956212997436523, 2.9715726375579834, 3.0475239753723145, 3.1234753131866455, 3.1994266510009766, 3.2753782272338867, 3.3513293266296387]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 7.0, 3.0, 6.0, 8.0, 19.0, 19.0, 47.0, 40.0, 49.0, 59.0, 57.0, 65.0, 65.0, 90.0, 79.0, 64.0, 74.0, 59.0, 37.0, 45.0, 27.0, 18.0, 15.0, 14.0, 11.0, 9.0, 7.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.409222960472107, -1.3669484853744507, -1.3246738910675049, -1.2823994159698486, -1.2401249408721924, -1.1978504657745361, -1.1555758714675903, -1.113301396369934, -1.0710268020629883, -1.028752326965332, -0.986477792263031, -0.94420325756073, -0.9019287824630737, -0.8596542477607727, -0.8173797130584717, -0.7751052379608154, -0.7328307628631592, -0.6905562281608582, -0.6482817530632019, -0.6060072183609009, -0.5637327432632446, -0.5214582085609436, -0.4791836738586426, -0.43690916895866394, -0.3946346640586853, -0.35236015915870667, -0.310085654258728, -0.267811119556427, -0.22553661465644836, -0.18326210975646973, -0.1409875750541687, -0.09871307015419006, -0.05643868446350098, -0.014164172112941742, 0.028110340237617493, 0.07038486003875732, 0.11265936493873596, 0.1549338698387146, 0.19720840454101562, 0.23948290944099426, 0.2817574143409729, 0.32403191924095154, 0.3663064241409302, 0.4085809588432312, 0.45085546374320984, 0.4931299686431885, 0.5354045033454895, 0.5776790380477905, 0.6199535131454468, 0.6622280478477478, 0.704502522945404, 0.7467770576477051, 0.7890515327453613, 0.8313260674476624, 0.8736006021499634, 0.9158750772476196, 0.9581496119499207, 1.0004241466522217, 1.042698621749878, 1.0849730968475342, 1.12724769115448, 1.1695221662521362, 1.211796760559082, 1.2540712356567383, 1.2963457107543945]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 7.0, 3.0, 7.0, 4.0, 9.0, 15.0, 19.0, 21.0, 23.0, 38.0, 55.0, 129.0, 259.0, 525.0, 1215.0, 4196.0, 42626.0, 887011.0, 102476.0, 6845.0, 1667.0, 660.0, 346.0, 156.0, 85.0, 48.0, 29.0, 28.0, 12.0, 13.0, 7.0, 9.0, 8.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.271484375, -2.21417236328125, -2.1568603515625, -2.09954833984375, -2.042236328125, -1.98492431640625, -1.9276123046875, -1.87030029296875, -1.81298828125, -1.75567626953125, -1.6983642578125, -1.64105224609375, -1.583740234375, -1.52642822265625, -1.4691162109375, -1.41180419921875, -1.3544921875, -1.29718017578125, -1.2398681640625, -1.18255615234375, -1.125244140625, -1.06793212890625, -1.0106201171875, -0.95330810546875, -0.89599609375, -0.83868408203125, -0.7813720703125, -0.72406005859375, -0.666748046875, -0.60943603515625, -0.5521240234375, -0.49481201171875, -0.4375, -0.38018798828125, -0.3228759765625, -0.26556396484375, -0.208251953125, -0.15093994140625, -0.0936279296875, -0.03631591796875, 0.02099609375, 0.07830810546875, 0.1356201171875, 0.19293212890625, 0.250244140625, 0.30755615234375, 0.3648681640625, 0.42218017578125, 0.4794921875, 0.53680419921875, 0.5941162109375, 0.65142822265625, 0.708740234375, 0.76605224609375, 0.8233642578125, 0.88067626953125, 0.93798828125, 0.99530029296875, 1.0526123046875, 1.10992431640625, 1.167236328125, 1.22454833984375, 1.2818603515625, 1.33917236328125, 1.396484375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 10.0, 34.0, 58.0, 85.0, 165.0, 167.0, 160.0, 131.0, 91.0, 52.0, 21.0, 10.0, 7.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.73486328125, -0.7188224792480469, -0.7027816772460938, -0.6867408752441406, -0.6707000732421875, -0.6546592712402344, -0.6386184692382812, -0.6225776672363281, -0.606536865234375, -0.5904960632324219, -0.5744552612304688, -0.5584144592285156, -0.5423736572265625, -0.5263328552246094, -0.5102920532226562, -0.4942512512207031, -0.47821044921875, -0.4621696472167969, -0.44612884521484375, -0.4300880432128906, -0.4140472412109375, -0.3980064392089844, -0.38196563720703125, -0.3659248352050781, -0.349884033203125, -0.3338432312011719, -0.31780242919921875, -0.3017616271972656, -0.2857208251953125, -0.2696800231933594, -0.25363922119140625, -0.23759841918945312, -0.2215576171875, -0.20551681518554688, -0.18947601318359375, -0.17343521118164062, -0.1573944091796875, -0.14135360717773438, -0.12531280517578125, -0.10927200317382812, -0.093231201171875, -0.07719039916992188, -0.06114959716796875, -0.045108795166015625, -0.0290679931640625, -0.013027191162109375, 0.00301361083984375, 0.019054412841796875, 0.03509521484375, 0.051136016845703125, 0.06717681884765625, 0.08321762084960938, 0.0992584228515625, 0.11529922485351562, 0.13134002685546875, 0.14738082885742188, 0.163421630859375, 0.17946243286132812, 0.19550323486328125, 0.21154403686523438, 0.2275848388671875, 0.24362564086914062, 0.25966644287109375, 0.2757072448730469, 0.291748046875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 2.0, 9.0, 19.0, 14.0, 12.0, 23.0, 29.0, 48.0, 64.0, 94.0, 194.0, 413.0, 1113.0, 3450.0, 13706.0, 87596.0, 759456.0, 154933.0, 20334.0, 4593.0, 1352.0, 516.0, 213.0, 108.0, 67.0, 45.0, 36.0, 22.0, 31.0, 11.0, 10.0, 8.0, 5.0, 3.0, 4.0, 6.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.0498046875, -1.01312255859375, -0.9764404296875, -0.93975830078125, -0.903076171875, -0.86639404296875, -0.8297119140625, -0.79302978515625, -0.75634765625, -0.71966552734375, -0.6829833984375, -0.64630126953125, -0.609619140625, -0.57293701171875, -0.5362548828125, -0.49957275390625, -0.462890625, -0.42620849609375, -0.3895263671875, -0.35284423828125, -0.316162109375, -0.27947998046875, -0.2427978515625, -0.20611572265625, -0.16943359375, -0.13275146484375, -0.0960693359375, -0.05938720703125, -0.022705078125, 0.01397705078125, 0.0506591796875, 0.08734130859375, 0.1240234375, 0.16070556640625, 0.1973876953125, 0.23406982421875, 0.270751953125, 0.30743408203125, 0.3441162109375, 0.38079833984375, 0.41748046875, 0.45416259765625, 0.4908447265625, 0.52752685546875, 0.564208984375, 0.60089111328125, 0.6375732421875, 0.67425537109375, 0.7109375, 0.74761962890625, 0.7843017578125, 0.82098388671875, 0.857666015625, 0.89434814453125, 0.9310302734375, 0.96771240234375, 1.00439453125, 1.04107666015625, 1.0777587890625, 1.11444091796875, 1.151123046875, 1.18780517578125, 1.2244873046875, 1.26116943359375, 1.2978515625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 5.0, 4.0, 6.0, 2.0, 9.0, 15.0, 24.0, 16.0, 28.0, 22.0, 27.0, 33.0, 45.0, 37.0, 55.0, 54.0, 51.0, 45.0, 56.0, 67.0, 61.0, 57.0, 52.0, 37.0, 31.0, 34.0, 27.0, 21.0, 13.0, 13.0, 9.0, 14.0, 11.0, 4.0, 1.0, 3.0, 3.0, 1.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.94091796875, -0.9139404296875, -0.886962890625, -0.8599853515625, -0.8330078125, -0.8060302734375, -0.779052734375, -0.7520751953125, -0.72509765625, -0.6981201171875, -0.671142578125, -0.6441650390625, -0.6171875, -0.5902099609375, -0.563232421875, -0.5362548828125, -0.50927734375, -0.4822998046875, -0.455322265625, -0.4283447265625, -0.4013671875, -0.3743896484375, -0.347412109375, -0.3204345703125, -0.29345703125, -0.2664794921875, -0.239501953125, -0.2125244140625, -0.185546875, -0.1585693359375, -0.131591796875, -0.1046142578125, -0.07763671875, -0.0506591796875, -0.023681640625, 0.0032958984375, 0.0302734375, 0.0572509765625, 0.084228515625, 0.1112060546875, 0.13818359375, 0.1651611328125, 0.192138671875, 0.2191162109375, 0.24609375, 0.2730712890625, 0.300048828125, 0.3270263671875, 0.35400390625, 0.3809814453125, 0.407958984375, 0.4349365234375, 0.4619140625, 0.4888916015625, 0.515869140625, 0.5428466796875, 0.56982421875, 0.5968017578125, 0.623779296875, 0.6507568359375, 0.677734375, 0.7047119140625, 0.731689453125, 0.7586669921875, 0.78564453125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 6.0, 6.0, 3.0, 12.0, 19.0, 23.0, 39.0, 55.0, 99.0, 188.0, 492.0, 2039.0, 13718.0, 441339.0, 571901.0, 15451.0, 2163.0, 553.0, 207.0, 99.0, 52.0, 40.0, 13.0, 7.0, 9.0, 6.0, 3.0, 7.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.468017578125, -0.4485359191894531, -0.42905426025390625, -0.4095726013183594, -0.3900909423828125, -0.3706092834472656, -0.35112762451171875, -0.3316459655761719, -0.312164306640625, -0.2926826477050781, -0.27320098876953125, -0.2537193298339844, -0.2342376708984375, -0.21475601196289062, -0.19527435302734375, -0.17579269409179688, -0.15631103515625, -0.13682937622070312, -0.11734771728515625, -0.09786605834960938, -0.0783843994140625, -0.058902740478515625, -0.03942108154296875, -0.019939422607421875, -0.000457763671875, 0.019023895263671875, 0.03850555419921875, 0.057987213134765625, 0.0774688720703125, 0.09695053100585938, 0.11643218994140625, 0.13591384887695312, 0.1553955078125, 0.17487716674804688, 0.19435882568359375, 0.21384048461914062, 0.2333221435546875, 0.2528038024902344, 0.27228546142578125, 0.2917671203613281, 0.311248779296875, 0.3307304382324219, 0.35021209716796875, 0.3696937561035156, 0.3891754150390625, 0.4086570739746094, 0.42813873291015625, 0.4476203918457031, 0.46710205078125, 0.4865837097167969, 0.5060653686523438, 0.5255470275878906, 0.5450286865234375, 0.5645103454589844, 0.5839920043945312, 0.6034736633300781, 0.622955322265625, 0.6424369812011719, 0.6619186401367188, 0.6814002990722656, 0.7008819580078125, 0.7203636169433594, 0.7398452758789062, 0.7593269348144531, 0.77880859375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 0.0, 5.0, 5.0, 13.0, 18.0, 24.0, 44.0, 131.0, 377.0, 217.0, 77.0, 38.0, 18.0, 17.0, 8.0, 8.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2067298889160156e-05, -2.9535964131355286e-05, -2.7004629373550415e-05, -2.4473294615745544e-05, -2.1941959857940674e-05, -1.9410625100135803e-05, -1.6879290342330933e-05, -1.4347955584526062e-05, -1.1816620826721191e-05, -9.28528606891632e-06, -6.75395131111145e-06, -4.22261655330658e-06, -1.691281795501709e-06, 8.400529623031616e-07, 3.3713877201080322e-06, 5.902722477912903e-06, 8.434057235717773e-06, 1.0965391993522644e-05, 1.3496726751327515e-05, 1.6028061509132385e-05, 1.8559396266937256e-05, 2.1090731024742126e-05, 2.3622065782546997e-05, 2.6153400540351868e-05, 2.8684735298156738e-05, 3.121607005596161e-05, 3.374740481376648e-05, 3.627873957157135e-05, 3.881007432937622e-05, 4.134140908718109e-05, 4.387274384498596e-05, 4.640407860279083e-05, 4.89354133605957e-05, 5.1466748118400574e-05, 5.3998082876205444e-05, 5.6529417634010315e-05, 5.9060752391815186e-05, 6.159208714962006e-05, 6.412342190742493e-05, 6.66547566652298e-05, 6.918609142303467e-05, 7.171742618083954e-05, 7.424876093864441e-05, 7.678009569644928e-05, 7.931143045425415e-05, 8.184276521205902e-05, 8.437409996986389e-05, 8.690543472766876e-05, 8.943676948547363e-05, 9.19681042432785e-05, 9.449943900108337e-05, 9.703077375888824e-05, 9.956210851669312e-05, 0.00010209344327449799, 0.00010462477803230286, 0.00010715611279010773, 0.0001096874475479126, 0.00011221878230571747, 0.00011475011706352234, 0.00011728145182132721, 0.00011981278657913208, 0.00012234412133693695, 0.00012487545609474182, 0.0001274067908525467, 0.00012993812561035156]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 2.0, 12.0, 28.0, 58.0, 93.0, 198.0, 616.0, 5950.0, 958701.0, 80393.0, 1902.0, 348.0, 125.0, 48.0, 43.0, 21.0, 10.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75390625, -0.719329833984375, -0.68475341796875, -0.650177001953125, -0.6156005859375, -0.581024169921875, -0.54644775390625, -0.511871337890625, -0.477294921875, -0.442718505859375, -0.40814208984375, -0.373565673828125, -0.3389892578125, -0.304412841796875, -0.26983642578125, -0.235260009765625, -0.20068359375, -0.166107177734375, -0.13153076171875, -0.096954345703125, -0.0623779296875, -0.027801513671875, 0.00677490234375, 0.041351318359375, 0.075927734375, 0.110504150390625, 0.14508056640625, 0.179656982421875, 0.2142333984375, 0.248809814453125, 0.28338623046875, 0.317962646484375, 0.3525390625, 0.387115478515625, 0.42169189453125, 0.456268310546875, 0.4908447265625, 0.525421142578125, 0.55999755859375, 0.594573974609375, 0.629150390625, 0.663726806640625, 0.69830322265625, 0.732879638671875, 0.7674560546875, 0.802032470703125, 0.83660888671875, 0.871185302734375, 0.90576171875, 0.940338134765625, 0.97491455078125, 1.009490966796875, 1.0440673828125, 1.078643798828125, 1.11322021484375, 1.147796630859375, 1.182373046875, 1.216949462890625, 1.25152587890625, 1.286102294921875, 1.3206787109375, 1.355255126953125, 1.38983154296875, 1.424407958984375, 1.458984375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 8.0, 3.0, 14.0, 30.0, 54.0, 108.0, 241.0, 288.0, 148.0, 49.0, 20.0, 15.0, 13.0, 9.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95166015625, -0.9326629638671875, -0.913665771484375, -0.8946685791015625, -0.87567138671875, -0.8566741943359375, -0.837677001953125, -0.8186798095703125, -0.7996826171875, -0.7806854248046875, -0.761688232421875, -0.7426910400390625, -0.72369384765625, -0.7046966552734375, -0.685699462890625, -0.6667022705078125, -0.647705078125, -0.6287078857421875, -0.609710693359375, -0.5907135009765625, -0.57171630859375, -0.5527191162109375, -0.533721923828125, -0.5147247314453125, -0.4957275390625, -0.4767303466796875, -0.457733154296875, -0.4387359619140625, -0.41973876953125, -0.4007415771484375, -0.381744384765625, -0.3627471923828125, -0.34375, -0.3247528076171875, -0.305755615234375, -0.2867584228515625, -0.26776123046875, -0.2487640380859375, -0.229766845703125, -0.2107696533203125, -0.1917724609375, -0.1727752685546875, -0.153778076171875, -0.1347808837890625, -0.11578369140625, -0.0967864990234375, -0.077789306640625, -0.0587921142578125, -0.039794921875, -0.0207977294921875, -0.001800537109375, 0.0171966552734375, 0.03619384765625, 0.0551910400390625, 0.074188232421875, 0.0931854248046875, 0.1121826171875, 0.1311798095703125, 0.150177001953125, 0.1691741943359375, 0.18817138671875, 0.2071685791015625, 0.226165771484375, 0.2451629638671875, 0.26416015625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 20.0, 49.0, 98.0, 268.0, 320.0, 139.0, 58.0, 28.0, 13.0, 4.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.300485610961914, -12.002562522888184, -11.704639434814453, -11.406717300415039, -11.108794212341309, -10.810871124267578, -10.512948989868164, -10.215025901794434, -9.917102813720703, -9.619179725646973, -9.321256637573242, -9.023334503173828, -8.725411415100098, -8.427488327026367, -8.129566192626953, -7.831643104553223, -7.533720016479492, -7.235796928405762, -6.9378743171691895, -6.639951705932617, -6.342028617858887, -6.044105529785156, -5.746182918548584, -5.448260307312012, -5.150337219238281, -4.852414131164551, -4.5544915199279785, -4.256568908691406, -3.958645820617676, -3.6607229709625244, -3.362800121307373, -3.0648772716522217, -2.766953945159912, -2.4690310955047607, -2.1711082458496094, -1.873185396194458, -1.5752625465393066, -1.2773396968841553, -0.9794168472290039, -0.6814939975738525, -0.38357114791870117, -0.0856482982635498, 0.21227455139160156, 0.5101974010467529, 0.8081202507019043, 1.1060431003570557, 1.403965950012207, 1.7018887996673584, 1.9998116493225098, 2.297734498977661, 2.5956573486328125, 2.893580198287964, 3.1915030479431152, 3.4894258975982666, 3.787348747253418, 4.085271835327148, 4.383194446563721, 4.681117057800293, 4.979040145874023, 5.276963233947754, 5.574885845184326, 5.872808456420898, 6.170731544494629, 6.468654632568359, 6.766577243804932]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 7.0, 1.0, 6.0, 9.0, 15.0, 14.0, 4.0, 13.0, 12.0, 18.0, 23.0, 23.0, 21.0, 33.0, 23.0, 32.0, 44.0, 43.0, 37.0, 41.0, 34.0, 36.0, 37.0, 37.0, 39.0, 41.0, 38.0, 34.0, 33.0, 32.0, 29.0, 26.0, 38.0, 24.0, 12.0, 14.0, 18.0, 5.0, 11.0, 11.0, 12.0, 8.0, 6.0, 4.0, 3.0, 1.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.060755968093872, -2.9560089111328125, -2.851261615753174, -2.7465145587921143, -2.6417675018310547, -2.537020206451416, -2.4322731494903564, -2.327526092529297, -2.222778797149658, -2.1180317401885986, -2.01328444480896, -1.9085373878479004, -1.8037902116775513, -1.6990430355072021, -1.5942959785461426, -1.4895488023757935, -1.3848016262054443, -1.2800544500350952, -1.175307273864746, -1.0705602169036865, -0.9658130407333374, -0.8610658645629883, -0.7563187479972839, -0.6515716314315796, -0.5468244552612305, -0.44207730889320374, -0.337330162525177, -0.23258301615715027, -0.12783586978912354, -0.023088693618774414, 0.08165842294692993, 0.18640553951263428, 0.2911524772644043, 0.39589962363243103, 0.5006467700004578, 0.6053938865661621, 0.7101410627365112, 0.8148882389068604, 0.9196353554725647, 1.024382472038269, 1.1291296482086182, 1.2338768243789673, 1.3386240005493164, 1.443371057510376, 1.548118233680725, 1.6528654098510742, 1.7576124668121338, 1.862359642982483, 1.967106819152832, 2.0718538761138916, 2.1766011714935303, 2.28134822845459, 2.3860955238342285, 2.490842580795288, 2.5955896377563477, 2.7003369331359863, 2.805083990097046, 2.9098310470581055, 3.014578342437744, 3.1193253993988037, 3.2240724563598633, 3.328819751739502, 3.4335668087005615, 3.538313865661621, 3.6430611610412598]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 11.0, 5.0, 7.0, 7.0, 11.0, 15.0, 10.0, 34.0, 48.0, 102.0, 205.0, 426.0, 1105.0, 4347.0, 75013.0, 4100315.0, 9852.0, 1778.0, 546.0, 229.0, 104.0, 44.0, 32.0, 13.0, 8.0, 3.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0], "bins": [-5.0859375, -4.9781951904296875, -4.870452880859375, -4.7627105712890625, -4.65496826171875, -4.5472259521484375, -4.439483642578125, -4.3317413330078125, -4.2239990234375, -4.1162567138671875, -4.008514404296875, -3.9007720947265625, -3.79302978515625, -3.6852874755859375, -3.577545166015625, -3.4698028564453125, -3.362060546875, -3.2543182373046875, -3.146575927734375, -3.0388336181640625, -2.93109130859375, -2.8233489990234375, -2.715606689453125, -2.6078643798828125, -2.5001220703125, -2.3923797607421875, -2.284637451171875, -2.1768951416015625, -2.06915283203125, -1.9614105224609375, -1.853668212890625, -1.7459259033203125, -1.63818359375, -1.5304412841796875, -1.422698974609375, -1.3149566650390625, -1.20721435546875, -1.0994720458984375, -0.991729736328125, -0.8839874267578125, -0.7762451171875, -0.6685028076171875, -0.560760498046875, -0.4530181884765625, -0.34527587890625, -0.2375335693359375, -0.129791259765625, -0.0220489501953125, 0.085693359375, 0.1934356689453125, 0.301177978515625, 0.4089202880859375, 0.51666259765625, 0.6244049072265625, 0.732147216796875, 0.8398895263671875, 0.9476318359375, 1.0553741455078125, 1.163116455078125, 1.2708587646484375, 1.37860107421875, 1.4863433837890625, 1.594085693359375, 1.7018280029296875, 1.8095703125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 16.0, 26.0, 43.0, 79.0, 107.0, 144.0, 154.0, 133.0, 118.0, 85.0, 42.0, 24.0, 13.0, 10.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.759765625, -0.7434196472167969, -0.7270736694335938, -0.7107276916503906, -0.6943817138671875, -0.6780357360839844, -0.6616897583007812, -0.6453437805175781, -0.628997802734375, -0.6126518249511719, -0.5963058471679688, -0.5799598693847656, -0.5636138916015625, -0.5472679138183594, -0.5309219360351562, -0.5145759582519531, -0.49822998046875, -0.4818840026855469, -0.46553802490234375, -0.4491920471191406, -0.4328460693359375, -0.4165000915527344, -0.40015411376953125, -0.3838081359863281, -0.367462158203125, -0.3511161804199219, -0.33477020263671875, -0.3184242248535156, -0.3020782470703125, -0.2857322692871094, -0.26938629150390625, -0.2530403137207031, -0.2366943359375, -0.22034835815429688, -0.20400238037109375, -0.18765640258789062, -0.1713104248046875, -0.15496444702148438, -0.13861846923828125, -0.12227249145507812, -0.105926513671875, -0.08958053588867188, -0.07323455810546875, -0.056888580322265625, -0.0405426025390625, -0.024196624755859375, -0.00785064697265625, 0.008495330810546875, 0.02484130859375, 0.041187286376953125, 0.05753326416015625, 0.07387924194335938, 0.0902252197265625, 0.10657119750976562, 0.12291717529296875, 0.13926315307617188, 0.155609130859375, 0.17195510864257812, 0.18830108642578125, 0.20464706420898438, 0.2209930419921875, 0.23733901977539062, 0.25368499755859375, 0.2700309753417969, 0.286376953125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 8.0, 5.0, 4.0, 5.0, 9.0, 18.0, 23.0, 35.0, 49.0, 98.0, 133.0, 209.0, 397.0, 695.0, 1558.0, 3836.0, 11837.0, 54698.0, 3874788.0, 208041.0, 25037.0, 7281.0, 2753.0, 1226.0, 582.0, 361.0, 217.0, 150.0, 96.0, 42.0, 42.0, 18.0, 14.0, 8.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.33203125, -1.2947845458984375, -1.257537841796875, -1.2202911376953125, -1.18304443359375, -1.1457977294921875, -1.108551025390625, -1.0713043212890625, -1.0340576171875, -0.9968109130859375, -0.959564208984375, -0.9223175048828125, -0.88507080078125, -0.8478240966796875, -0.810577392578125, -0.7733306884765625, -0.736083984375, -0.6988372802734375, -0.661590576171875, -0.6243438720703125, -0.58709716796875, -0.5498504638671875, -0.512603759765625, -0.4753570556640625, -0.4381103515625, -0.4008636474609375, -0.363616943359375, -0.3263702392578125, -0.28912353515625, -0.2518768310546875, -0.214630126953125, -0.1773834228515625, -0.14013671875, -0.1028900146484375, -0.065643310546875, -0.0283966064453125, 0.00885009765625, 0.0460968017578125, 0.083343505859375, 0.1205902099609375, 0.1578369140625, 0.1950836181640625, 0.232330322265625, 0.2695770263671875, 0.30682373046875, 0.3440704345703125, 0.381317138671875, 0.4185638427734375, 0.455810546875, 0.4930572509765625, 0.530303955078125, 0.5675506591796875, 0.60479736328125, 0.6420440673828125, 0.679290771484375, 0.7165374755859375, 0.7537841796875, 0.7910308837890625, 0.828277587890625, 0.8655242919921875, 0.90277099609375, 0.9400177001953125, 0.977264404296875, 1.0145111083984375, 1.0517578125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 9.0, 9.0, 19.0, 23.0, 33.0, 63.0, 123.0, 769.0, 2628.0, 153.0, 66.0, 48.0, 33.0, 18.0, 12.0, 14.0, 11.0, 8.0, 6.0, 5.0, 6.0, 5.0, 1.0, 0.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.35498046875, -0.34137725830078125, -0.3277740478515625, -0.31417083740234375, -0.300567626953125, -0.28696441650390625, -0.2733612060546875, -0.25975799560546875, -0.24615478515625, -0.23255157470703125, -0.2189483642578125, -0.20534515380859375, -0.191741943359375, -0.17813873291015625, -0.1645355224609375, -0.15093231201171875, -0.1373291015625, -0.12372589111328125, -0.1101226806640625, -0.09651947021484375, -0.082916259765625, -0.06931304931640625, -0.0557098388671875, -0.04210662841796875, -0.02850341796875, -0.01490020751953125, -0.0012969970703125, 0.01230621337890625, 0.025909423828125, 0.03951263427734375, 0.0531158447265625, 0.06671905517578125, 0.080322265625, 0.09392547607421875, 0.1075286865234375, 0.12113189697265625, 0.134735107421875, 0.14833831787109375, 0.1619415283203125, 0.17554473876953125, 0.18914794921875, 0.20275115966796875, 0.2163543701171875, 0.22995758056640625, 0.243560791015625, 0.25716400146484375, 0.2707672119140625, 0.28437042236328125, 0.2979736328125, 0.31157684326171875, 0.3251800537109375, 0.33878326416015625, 0.352386474609375, 0.36598968505859375, 0.3795928955078125, 0.39319610595703125, 0.40679931640625, 0.42040252685546875, 0.4340057373046875, 0.44760894775390625, 0.461212158203125, 0.47481536865234375, 0.4884185791015625, 0.5020217895507812, 0.515625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 11.0, 53.0, 248.0, 441.0, 164.0, 52.0, 24.0, 8.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.920597076416016, -4.764099597930908, -4.607602596282959, -4.451105117797852, -4.294608116149902, -4.138110637664795, -3.9816133975982666, -3.8251161575317383, -3.66861891746521, -3.5121216773986816, -3.3556244373321533, -3.199127197265625, -3.0426297187805176, -2.8861327171325684, -2.729635238647461, -2.5731379985809326, -2.4166407585144043, -2.260143518447876, -2.1036462783813477, -1.9471489191055298, -1.7906516790390015, -1.6341544389724731, -1.4776570796966553, -1.321159839630127, -1.1646625995635986, -1.0081653594970703, -0.8516680598258972, -0.6951707601547241, -0.5386735200881958, -0.3821762800216675, -0.22567898035049438, -0.06918168067932129, 0.08731555938720703, 0.24381282925605774, 0.40031009912490845, 0.5568073987960815, 0.7133046388626099, 0.8698018789291382, 1.026299238204956, 1.1827964782714844, 1.3392937183380127, 1.495790958404541, 1.6522881984710693, 1.8087855577468872, 1.9652827978134155, 2.1217799186706543, 2.2782773971557617, 2.43477463722229, 2.5912718772888184, 2.7477691173553467, 2.904266357421875, 3.0607635974884033, 3.2172608375549316, 3.373758316040039, 3.5302555561065674, 3.6867527961730957, 3.843250036239624, 3.9997472763061523, 4.15624475479126, 4.312741756439209, 4.469239234924316, 4.625736236572266, 4.782233715057373, 4.9387311935424805, 5.09522819519043]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 15.0, 16.0, 22.0, 27.0, 49.0, 62.0, 70.0, 82.0, 85.0, 96.0, 81.0, 84.0, 78.0, 62.0, 47.0, 36.0, 40.0, 16.0, 14.0, 4.0, 7.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9566502571105957, -1.8838406801223755, -1.8110312223434448, -1.7382216453552246, -1.665412187576294, -1.5926026105880737, -1.5197930335998535, -1.4469835758209229, -1.3741739988327026, -1.3013644218444824, -1.2285549640655518, -1.1557453870773315, -1.0829358100891113, -1.0101263523101807, -0.9373167753219604, -0.864507257938385, -0.7916977405548096, -0.7188882231712341, -0.6460787057876587, -0.5732691287994385, -0.500459611415863, -0.4276500940322876, -0.35484054684638977, -0.28203099966049194, -0.2092214822769165, -0.13641194999217987, -0.06360241770744324, 0.009207114577293396, 0.08201664686203003, 0.15482616424560547, 0.2276357114315033, 0.3004452586174011, 0.37325501441955566, 0.4460645318031311, 0.5188740491867065, 0.5916836261749268, 0.6644931435585022, 0.7373026609420776, 0.8101122379302979, 0.8829217553138733, 0.9557312726974487, 1.028540849685669, 1.1013503074645996, 1.1741598844528198, 1.24696946144104, 1.3197789192199707, 1.392588496208191, 1.4653980731964111, 1.5382075309753418, 1.611017107963562, 1.6838265657424927, 1.756636142730713, 1.8294456005096436, 1.9022551774978638, 1.975064754486084, 2.0478742122650146, 2.1206836700439453, 2.193493127822876, 2.2663028240203857, 2.3391122817993164, 2.411921739578247, 2.4847311973571777, 2.5575408935546875, 2.630350351333618, 2.703160047531128]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 6.0, 5.0, 6.0, 5.0, 8.0, 9.0, 14.0, 20.0, 12.0, 22.0, 48.0, 50.0, 69.0, 102.0, 143.0, 369.0, 612.0, 1397.0, 3723.0, 14554.0, 80670.0, 683550.0, 222724.0, 29541.0, 6764.0, 2189.0, 865.0, 441.0, 237.0, 96.0, 94.0, 43.0, 51.0, 29.0, 25.0, 15.0, 10.0, 7.0, 8.0, 7.0, 3.0, 3.0, 0.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.6064453125, -1.5573577880859375, -1.508270263671875, -1.4591827392578125, -1.41009521484375, -1.3610076904296875, -1.311920166015625, -1.2628326416015625, -1.2137451171875, -1.1646575927734375, -1.115570068359375, -1.0664825439453125, -1.01739501953125, -0.9683074951171875, -0.919219970703125, -0.8701324462890625, -0.821044921875, -0.7719573974609375, -0.722869873046875, -0.6737823486328125, -0.62469482421875, -0.5756072998046875, -0.526519775390625, -0.4774322509765625, -0.4283447265625, -0.3792572021484375, -0.330169677734375, -0.2810821533203125, -0.23199462890625, -0.1829071044921875, -0.133819580078125, -0.0847320556640625, -0.03564453125, 0.0134429931640625, 0.062530517578125, 0.1116180419921875, 0.16070556640625, 0.2097930908203125, 0.258880615234375, 0.3079681396484375, 0.3570556640625, 0.4061431884765625, 0.455230712890625, 0.5043182373046875, 0.55340576171875, 0.6024932861328125, 0.651580810546875, 0.7006683349609375, 0.749755859375, 0.7988433837890625, 0.847930908203125, 0.8970184326171875, 0.94610595703125, 0.9951934814453125, 1.044281005859375, 1.0933685302734375, 1.1424560546875, 1.1915435791015625, 1.240631103515625, 1.2897186279296875, 1.33880615234375, 1.3878936767578125, 1.436981201171875, 1.4860687255859375, 1.53515625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 20.0, 20.0, 46.0, 80.0, 87.0, 129.0, 129.0, 133.0, 115.0, 95.0, 63.0, 31.0, 19.0, 13.0, 14.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.72998046875, -0.7140464782714844, -0.6981124877929688, -0.6821784973144531, -0.6662445068359375, -0.6503105163574219, -0.6343765258789062, -0.6184425354003906, -0.602508544921875, -0.5865745544433594, -0.5706405639648438, -0.5547065734863281, -0.5387725830078125, -0.5228385925292969, -0.5069046020507812, -0.4909706115722656, -0.47503662109375, -0.4591026306152344, -0.44316864013671875, -0.4272346496582031, -0.4113006591796875, -0.3953666687011719, -0.37943267822265625, -0.3634986877441406, -0.347564697265625, -0.3316307067871094, -0.31569671630859375, -0.2997627258300781, -0.2838287353515625, -0.2678947448730469, -0.25196075439453125, -0.23602676391601562, -0.2200927734375, -0.20415878295898438, -0.18822479248046875, -0.17229080200195312, -0.1563568115234375, -0.14042282104492188, -0.12448883056640625, -0.10855484008789062, -0.092620849609375, -0.07668685913085938, -0.06075286865234375, -0.044818878173828125, -0.0288848876953125, -0.012950897216796875, 0.00298309326171875, 0.018917083740234375, 0.03485107421875, 0.050785064697265625, 0.06671905517578125, 0.08265304565429688, 0.0985870361328125, 0.11452102661132812, 0.13045501708984375, 0.14638900756835938, 0.162322998046875, 0.17825698852539062, 0.19419097900390625, 0.21012496948242188, 0.2260589599609375, 0.24199295043945312, 0.25792694091796875, 0.2738609313964844, 0.289794921875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 6.0, 2.0, 5.0, 5.0, 14.0, 13.0, 21.0, 25.0, 39.0, 55.0, 81.0, 140.0, 228.0, 427.0, 776.0, 1597.0, 3513.0, 9316.0, 30409.0, 141664.0, 665351.0, 146531.0, 31341.0, 9604.0, 3676.0, 1705.0, 826.0, 463.0, 278.0, 166.0, 89.0, 58.0, 53.0, 23.0, 18.0, 11.0, 11.0, 4.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.220703125, -1.1819610595703125, -1.143218994140625, -1.1044769287109375, -1.06573486328125, -1.0269927978515625, -0.988250732421875, -0.9495086669921875, -0.9107666015625, -0.8720245361328125, -0.833282470703125, -0.7945404052734375, -0.75579833984375, -0.7170562744140625, -0.678314208984375, -0.6395721435546875, -0.600830078125, -0.5620880126953125, -0.523345947265625, -0.4846038818359375, -0.44586181640625, -0.4071197509765625, -0.368377685546875, -0.3296356201171875, -0.2908935546875, -0.2521514892578125, -0.213409423828125, -0.1746673583984375, -0.13592529296875, -0.0971832275390625, -0.058441162109375, -0.0196990966796875, 0.01904296875, 0.0577850341796875, 0.096527099609375, 0.1352691650390625, 0.17401123046875, 0.2127532958984375, 0.251495361328125, 0.2902374267578125, 0.3289794921875, 0.3677215576171875, 0.406463623046875, 0.4452056884765625, 0.48394775390625, 0.5226898193359375, 0.561431884765625, 0.6001739501953125, 0.638916015625, 0.6776580810546875, 0.716400146484375, 0.7551422119140625, 0.79388427734375, 0.8326263427734375, 0.871368408203125, 0.9101104736328125, 0.9488525390625, 0.9875946044921875, 1.026336669921875, 1.0650787353515625, 1.10382080078125, 1.1425628662109375, 1.181304931640625, 1.2200469970703125, 1.2587890625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 11.0, 7.0, 12.0, 16.0, 21.0, 30.0, 40.0, 39.0, 44.0, 59.0, 60.0, 57.0, 70.0, 71.0, 85.0, 71.0, 63.0, 47.0, 46.0, 29.0, 27.0, 25.0, 16.0, 7.0, 11.0, 9.0, 9.0, 4.0, 2.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4599609375, -1.4111785888671875, -1.362396240234375, -1.3136138916015625, -1.26483154296875, -1.2160491943359375, -1.167266845703125, -1.1184844970703125, -1.0697021484375, -1.0209197998046875, -0.972137451171875, -0.9233551025390625, -0.87457275390625, -0.8257904052734375, -0.777008056640625, -0.7282257080078125, -0.679443359375, -0.6306610107421875, -0.581878662109375, -0.5330963134765625, -0.48431396484375, -0.4355316162109375, -0.386749267578125, -0.3379669189453125, -0.2891845703125, -0.2404022216796875, -0.191619873046875, -0.1428375244140625, -0.09405517578125, -0.0452728271484375, 0.003509521484375, 0.0522918701171875, 0.10107421875, 0.1498565673828125, 0.198638916015625, 0.2474212646484375, 0.29620361328125, 0.3449859619140625, 0.393768310546875, 0.4425506591796875, 0.4913330078125, 0.5401153564453125, 0.588897705078125, 0.6376800537109375, 0.68646240234375, 0.7352447509765625, 0.784027099609375, 0.8328094482421875, 0.881591796875, 0.9303741455078125, 0.979156494140625, 1.0279388427734375, 1.07672119140625, 1.1255035400390625, 1.174285888671875, 1.2230682373046875, 1.2718505859375, 1.3206329345703125, 1.369415283203125, 1.4181976318359375, 1.46697998046875, 1.5157623291015625, 1.564544677734375, 1.6133270263671875, 1.662109375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 9.0, 11.0, 10.0, 17.0, 39.0, 62.0, 110.0, 177.0, 329.0, 598.0, 1177.0, 2503.0, 6954.0, 28276.0, 647902.0, 328059.0, 21957.0, 5847.0, 2275.0, 1039.0, 524.0, 285.0, 154.0, 100.0, 53.0, 24.0, 15.0, 18.0, 5.0, 2.0, 9.0, 1.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9443359375, -0.9147567749023438, -0.8851776123046875, -0.8555984497070312, -0.826019287109375, -0.7964401245117188, -0.7668609619140625, -0.7372817993164062, -0.70770263671875, -0.6781234741210938, -0.6485443115234375, -0.6189651489257812, -0.589385986328125, -0.5598068237304688, -0.5302276611328125, -0.5006484985351562, -0.4710693359375, -0.44149017333984375, -0.4119110107421875, -0.38233184814453125, -0.352752685546875, -0.32317352294921875, -0.2935943603515625, -0.26401519775390625, -0.23443603515625, -0.20485687255859375, -0.1752777099609375, -0.14569854736328125, -0.116119384765625, -0.08654022216796875, -0.0569610595703125, -0.02738189697265625, 0.002197265625, 0.03177642822265625, 0.0613555908203125, 0.09093475341796875, 0.120513916015625, 0.15009307861328125, 0.1796722412109375, 0.20925140380859375, 0.23883056640625, 0.26840972900390625, 0.2979888916015625, 0.32756805419921875, 0.357147216796875, 0.38672637939453125, 0.4163055419921875, 0.44588470458984375, 0.4754638671875, 0.5050430297851562, 0.5346221923828125, 0.5642013549804688, 0.593780517578125, 0.6233596801757812, 0.6529388427734375, 0.6825180053710938, 0.71209716796875, 0.7416763305664062, 0.7712554931640625, 0.8008346557617188, 0.830413818359375, 0.8599929809570312, 0.8895721435546875, 0.9191513061523438, 0.94873046875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 2.0, 3.0, 3.0, 3.0, 6.0, 9.0, 11.0, 11.0, 21.0, 28.0, 30.0, 65.0, 98.0, 138.0, 190.0, 136.0, 99.0, 41.0, 28.0, 22.0, 13.0, 14.0, 3.0, 1.0, 6.0, 4.0, 2.0, 7.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.052587509155273e-05, -7.837172597646713e-05, -7.621757686138153e-05, -7.406342774629593e-05, -7.190927863121033e-05, -6.975512951612473e-05, -6.760098040103912e-05, -6.544683128595352e-05, -6.329268217086792e-05, -6.113853305578232e-05, -5.8984383940696716e-05, -5.6830234825611115e-05, -5.467608571052551e-05, -5.252193659543991e-05, -5.036778748035431e-05, -4.821363836526871e-05, -4.6059489250183105e-05, -4.3905340135097504e-05, -4.17511910200119e-05, -3.95970419049263e-05, -3.74428927898407e-05, -3.5288743674755096e-05, -3.3134594559669495e-05, -3.098044544458389e-05, -2.882629632949829e-05, -2.667214721441269e-05, -2.4517998099327087e-05, -2.2363848984241486e-05, -2.0209699869155884e-05, -1.8055550754070282e-05, -1.590140163898468e-05, -1.3747252523899078e-05, -1.1593103408813477e-05, -9.438954293727875e-06, -7.284805178642273e-06, -5.130656063556671e-06, -2.9765069484710693e-06, -8.223578333854675e-07, 1.3317912817001343e-06, 3.485940396785736e-06, 5.640089511871338e-06, 7.79423862695694e-06, 9.948387742042542e-06, 1.2102536857128143e-05, 1.4256685972213745e-05, 1.6410835087299347e-05, 1.856498420238495e-05, 2.071913331747055e-05, 2.2873282432556152e-05, 2.5027431547641754e-05, 2.7181580662727356e-05, 2.9335729777812958e-05, 3.148987889289856e-05, 3.364402800798416e-05, 3.579817712306976e-05, 3.7952326238155365e-05, 4.010647535324097e-05, 4.226062446832657e-05, 4.441477358341217e-05, 4.656892269849777e-05, 4.8723071813583374e-05, 5.0877220928668976e-05, 5.303137004375458e-05, 5.518551915884018e-05, 5.733966827392578e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 5.0, 6.0, 4.0, 5.0, 13.0, 24.0, 43.0, 77.0, 193.0, 522.0, 1807.0, 9182.0, 739834.0, 287583.0, 7055.0, 1444.0, 440.0, 149.0, 73.0, 33.0, 22.0, 17.0, 9.0, 8.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7578125, -1.707489013671875, -1.65716552734375, -1.606842041015625, -1.5565185546875, -1.506195068359375, -1.45587158203125, -1.405548095703125, -1.355224609375, -1.304901123046875, -1.25457763671875, -1.204254150390625, -1.1539306640625, -1.103607177734375, -1.05328369140625, -1.002960205078125, -0.95263671875, -0.902313232421875, -0.85198974609375, -0.801666259765625, -0.7513427734375, -0.701019287109375, -0.65069580078125, -0.600372314453125, -0.550048828125, -0.499725341796875, -0.44940185546875, -0.399078369140625, -0.3487548828125, -0.298431396484375, -0.24810791015625, -0.197784423828125, -0.1474609375, -0.097137451171875, -0.04681396484375, 0.003509521484375, 0.0538330078125, 0.104156494140625, 0.15447998046875, 0.204803466796875, 0.255126953125, 0.305450439453125, 0.35577392578125, 0.406097412109375, 0.4564208984375, 0.506744384765625, 0.55706787109375, 0.607391357421875, 0.65771484375, 0.708038330078125, 0.75836181640625, 0.808685302734375, 0.8590087890625, 0.909332275390625, 0.95965576171875, 1.009979248046875, 1.060302734375, 1.110626220703125, 1.16094970703125, 1.211273193359375, 1.2615966796875, 1.311920166015625, 1.36224365234375, 1.412567138671875, 1.462890625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 7.0, 4.0, 12.0, 19.0, 28.0, 39.0, 64.0, 112.0, 155.0, 180.0, 134.0, 88.0, 45.0, 22.0, 21.0, 21.0, 9.0, 7.0, 8.0, 7.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.85693359375, -0.8319168090820312, -0.8069000244140625, -0.7818832397460938, -0.756866455078125, -0.7318496704101562, -0.7068328857421875, -0.6818161010742188, -0.65679931640625, -0.6317825317382812, -0.6067657470703125, -0.5817489624023438, -0.556732177734375, -0.5317153930664062, -0.5066986083984375, -0.48168182373046875, -0.4566650390625, -0.43164825439453125, -0.4066314697265625, -0.38161468505859375, -0.356597900390625, -0.33158111572265625, -0.3065643310546875, -0.28154754638671875, -0.25653076171875, -0.23151397705078125, -0.2064971923828125, -0.18148040771484375, -0.156463623046875, -0.13144683837890625, -0.1064300537109375, -0.08141326904296875, -0.056396484375, -0.03137969970703125, -0.0063629150390625, 0.01865386962890625, 0.043670654296875, 0.06868743896484375, 0.0937042236328125, 0.11872100830078125, 0.14373779296875, 0.16875457763671875, 0.1937713623046875, 0.21878814697265625, 0.243804931640625, 0.26882171630859375, 0.2938385009765625, 0.31885528564453125, 0.3438720703125, 0.36888885498046875, 0.3939056396484375, 0.41892242431640625, 0.443939208984375, 0.46895599365234375, 0.4939727783203125, 0.5189895629882812, 0.54400634765625, 0.5690231323242188, 0.5940399169921875, 0.6190567016601562, 0.644073486328125, 0.6690902709960938, 0.6941070556640625, 0.7191238403320312, 0.744140625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 8.0, 41.0, 99.0, 383.0, 328.0, 86.0, 35.0, 17.0, 7.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.99549865722656, -43.13209915161133, -42.268699645996094, -41.405303955078125, -40.54190444946289, -39.678504943847656, -38.81510543823242, -37.95170593261719, -37.08831024169922, -36.224910736083984, -35.36151123046875, -34.49811553955078, -33.63471603393555, -32.77131652832031, -31.907917022705078, -31.044519424438477, -30.181119918823242, -29.317720413208008, -28.454322814941406, -27.590923309326172, -26.72752571105957, -25.864126205444336, -25.000728607177734, -24.1373291015625, -23.273929595947266, -22.41053009033203, -21.54713249206543, -20.683732986450195, -19.820335388183594, -18.95693588256836, -18.093536376953125, -17.230138778686523, -16.366741180419922, -15.503342628479004, -14.639944076538086, -13.776544570922852, -12.91314697265625, -12.049747467041016, -11.186348915100098, -10.32295036315918, -9.459550857543945, -8.596152305603027, -7.732753753662109, -6.869354724884033, -6.005956172943115, -5.142557621002197, -4.279158592224121, -3.415760040283203, -2.552361488342285, -1.6889628171920776, -0.8255641460418701, 0.03783464431762695, 0.9012331962585449, 1.764631748199463, 2.628030776977539, 3.491429328918457, 4.354827880859375, 5.218226432800293, 6.081624984741211, 6.945024013519287, 7.808422565460205, 8.671821594238281, 9.5352201461792, 10.398618698120117, 11.262017250061035]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 7.0, 10.0, 8.0, 11.0, 18.0, 26.0, 13.0, 14.0, 30.0, 21.0, 30.0, 38.0, 34.0, 40.0, 34.0, 42.0, 45.0, 36.0, 48.0, 34.0, 31.0, 41.0, 37.0, 42.0, 39.0, 32.0, 31.0, 25.0, 26.0, 31.0, 23.0, 17.0, 17.0, 14.0, 10.0, 10.0, 10.0, 1.0, 7.0, 6.0, 6.0, 1.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.0648722648620605, -6.840939998626709, -6.617007255554199, -6.393074989318848, -6.169142723083496, -5.9452104568481445, -5.721277713775635, -5.497345447540283, -5.273412704467773, -5.049480438232422, -4.825547695159912, -4.6016154289245605, -4.377683162689209, -4.153750419616699, -3.9298181533813477, -3.705885887145996, -3.4819536209106445, -3.258021116256714, -3.0340888500213623, -2.8101563453674316, -2.58622407913208, -2.3622915744781494, -2.1383590698242188, -1.9144266843795776, -1.6904942989349365, -1.4665619134902954, -1.2426295280456543, -1.0186970233917236, -0.7947646379470825, -0.5708322525024414, -0.34689974784851074, -0.12296736240386963, 0.10096454620361328, 0.3248969614505768, 0.5488293766975403, 0.7727618217468262, 0.9966942071914673, 1.2206265926361084, 1.444559097290039, 1.6684914827346802, 1.8924238681793213, 2.116356372833252, 2.3402886390686035, 2.564221143722534, 2.788153648376465, 3.0120859146118164, 3.236018419265747, 3.4599509239196777, 3.6838831901550293, 3.90781569480896, 4.131748199462891, 4.355680465698242, 4.579612731933594, 4.803544998168945, 5.027477741241455, 5.251410007476807, 5.475342750549316, 5.699275016784668, 5.923207759857178, 6.147140026092529, 6.371072292327881, 6.595005035400391, 6.818937301635742, 7.042869567871094, 7.266801834106445]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 6.0, 13.0, 11.0, 20.0, 18.0, 24.0, 35.0, 51.0, 67.0, 139.0, 242.0, 502.0, 1150.0, 2639.0, 7669.0, 39533.0, 3961892.0, 156422.0, 16643.0, 4222.0, 1574.0, 714.0, 317.0, 178.0, 83.0, 48.0, 28.0, 12.0, 6.0, 6.0, 6.0, 3.0, 2.0, 1.0, 2.0], "bins": [-3.640625, -3.561065673828125, -3.48150634765625, -3.401947021484375, -3.3223876953125, -3.242828369140625, -3.16326904296875, -3.083709716796875, -3.004150390625, -2.924591064453125, -2.84503173828125, -2.765472412109375, -2.6859130859375, -2.606353759765625, -2.52679443359375, -2.447235107421875, -2.36767578125, -2.288116455078125, -2.20855712890625, -2.128997802734375, -2.0494384765625, -1.969879150390625, -1.89031982421875, -1.810760498046875, -1.731201171875, -1.651641845703125, -1.57208251953125, -1.492523193359375, -1.4129638671875, -1.333404541015625, -1.25384521484375, -1.174285888671875, -1.0947265625, -1.015167236328125, -0.93560791015625, -0.856048583984375, -0.7764892578125, -0.696929931640625, -0.61737060546875, -0.537811279296875, -0.458251953125, -0.378692626953125, -0.29913330078125, -0.219573974609375, -0.1400146484375, -0.060455322265625, 0.01910400390625, 0.098663330078125, 0.17822265625, 0.257781982421875, 0.33734130859375, 0.416900634765625, 0.4964599609375, 0.576019287109375, 0.65557861328125, 0.735137939453125, 0.814697265625, 0.894256591796875, 0.97381591796875, 1.053375244140625, 1.1329345703125, 1.212493896484375, 1.29205322265625, 1.371612548828125, 1.451171875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 5.0, 14.0, 23.0, 51.0, 64.0, 67.0, 70.0, 98.0, 88.0, 102.0, 108.0, 94.0, 61.0, 60.0, 27.0, 29.0, 17.0, 11.0, 7.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.7958984375, -0.7785758972167969, -0.7612533569335938, -0.7439308166503906, -0.7266082763671875, -0.7092857360839844, -0.6919631958007812, -0.6746406555175781, -0.657318115234375, -0.6399955749511719, -0.6226730346679688, -0.6053504943847656, -0.5880279541015625, -0.5707054138183594, -0.5533828735351562, -0.5360603332519531, -0.51873779296875, -0.5014152526855469, -0.48409271240234375, -0.4667701721191406, -0.4494476318359375, -0.4321250915527344, -0.41480255126953125, -0.3974800109863281, -0.380157470703125, -0.3628349304199219, -0.34551239013671875, -0.3281898498535156, -0.3108673095703125, -0.2935447692871094, -0.27622222900390625, -0.2588996887207031, -0.2415771484375, -0.22425460815429688, -0.20693206787109375, -0.18960952758789062, -0.1722869873046875, -0.15496444702148438, -0.13764190673828125, -0.12031936645507812, -0.102996826171875, -0.08567428588867188, -0.06835174560546875, -0.051029205322265625, -0.0337066650390625, -0.016384124755859375, 0.00093841552734375, 0.018260955810546875, 0.03558349609375, 0.052906036376953125, 0.07022857666015625, 0.08755111694335938, 0.1048736572265625, 0.12219619750976562, 0.13951873779296875, 0.15684127807617188, 0.174163818359375, 0.19148635864257812, 0.20880889892578125, 0.22613143920898438, 0.2434539794921875, 0.2607765197753906, 0.27809906005859375, 0.2954216003417969, 0.312744140625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 5.0, 10.0, 15.0, 19.0, 19.0, 31.0, 51.0, 80.0, 133.0, 167.0, 271.0, 407.0, 686.0, 1134.0, 2009.0, 3732.0, 7749.0, 18883.0, 67658.0, 2933291.0, 1060787.0, 62977.0, 18255.0, 7378.0, 3512.0, 1960.0, 1102.0, 700.0, 424.0, 275.0, 181.0, 125.0, 84.0, 50.0, 38.0, 26.0, 16.0, 10.0, 10.0, 8.0, 2.0, 4.0, 1.0, 4.0, 0.0, 2.0, 2.0], "bins": [-1.4951171875, -1.454681396484375, -1.41424560546875, -1.373809814453125, -1.3333740234375, -1.292938232421875, -1.25250244140625, -1.212066650390625, -1.171630859375, -1.131195068359375, -1.09075927734375, -1.050323486328125, -1.0098876953125, -0.969451904296875, -0.92901611328125, -0.888580322265625, -0.84814453125, -0.807708740234375, -0.76727294921875, -0.726837158203125, -0.6864013671875, -0.645965576171875, -0.60552978515625, -0.565093994140625, -0.524658203125, -0.484222412109375, -0.44378662109375, -0.403350830078125, -0.3629150390625, -0.322479248046875, -0.28204345703125, -0.241607666015625, -0.201171875, -0.160736083984375, -0.12030029296875, -0.079864501953125, -0.0394287109375, 0.001007080078125, 0.04144287109375, 0.081878662109375, 0.122314453125, 0.162750244140625, 0.20318603515625, 0.243621826171875, 0.2840576171875, 0.324493408203125, 0.36492919921875, 0.405364990234375, 0.44580078125, 0.486236572265625, 0.52667236328125, 0.567108154296875, 0.6075439453125, 0.647979736328125, 0.68841552734375, 0.728851318359375, 0.769287109375, 0.809722900390625, 0.85015869140625, 0.890594482421875, 0.9310302734375, 0.971466064453125, 1.01190185546875, 1.052337646484375, 1.0927734375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 7.0, 2.0, 2.0, 7.0, 9.0, 5.0, 15.0, 15.0, 31.0, 62.0, 83.0, 162.0, 2696.0, 532.0, 169.0, 87.0, 60.0, 27.0, 18.0, 24.0, 13.0, 13.0, 9.0, 6.0, 4.0, 2.0, 3.0, 3.0, 3.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65966796875, -0.6350479125976562, -0.6104278564453125, -0.5858078002929688, -0.561187744140625, -0.5365676879882812, -0.5119476318359375, -0.48732757568359375, -0.46270751953125, -0.43808746337890625, -0.4134674072265625, -0.38884735107421875, -0.364227294921875, -0.33960723876953125, -0.3149871826171875, -0.29036712646484375, -0.2657470703125, -0.24112701416015625, -0.2165069580078125, -0.19188690185546875, -0.167266845703125, -0.14264678955078125, -0.1180267333984375, -0.09340667724609375, -0.06878662109375, -0.04416656494140625, -0.0195465087890625, 0.00507354736328125, 0.029693603515625, 0.05431365966796875, 0.0789337158203125, 0.10355377197265625, 0.128173828125, 0.15279388427734375, 0.1774139404296875, 0.20203399658203125, 0.226654052734375, 0.25127410888671875, 0.2758941650390625, 0.30051422119140625, 0.32513427734375, 0.34975433349609375, 0.3743743896484375, 0.39899444580078125, 0.423614501953125, 0.44823455810546875, 0.4728546142578125, 0.49747467041015625, 0.5220947265625, 0.5467147827148438, 0.5713348388671875, 0.5959548950195312, 0.620574951171875, 0.6451950073242188, 0.6698150634765625, 0.6944351196289062, 0.71905517578125, 0.7436752319335938, 0.7682952880859375, 0.7929153442382812, 0.817535400390625, 0.8421554565429688, 0.8667755126953125, 0.8913955688476562, 0.916015625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 7.0, 9.0, 23.0, 38.0, 107.0, 216.0, 254.0, 151.0, 98.0, 44.0, 19.0, 19.0, 7.0, 8.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4229354858398438, -3.2424254417419434, -3.061915636062622, -2.8814055919647217, -2.7008957862854004, -2.5203857421875, -2.3398756980895996, -2.1593658924102783, -1.9788559675216675, -1.7983460426330566, -1.6178361177444458, -1.437326192855835, -1.2568161487579346, -1.0763063430786133, -0.8957962989807129, -0.715286374092102, -0.5347764492034912, -0.35426652431488037, -0.17375656962394714, 0.006753385066986084, 0.18726330995559692, 0.36777323484420776, 0.5482832193374634, 0.7287931442260742, 0.9093030691146851, 1.089812994003296, 1.2703229188919067, 1.4508328437805176, 1.631342887878418, 1.8118526935577393, 1.9923627376556396, 2.172872543334961, 2.3533825874328613, 2.5338926315307617, 2.714402437210083, 2.8949124813079834, 3.0754222869873047, 3.255932331085205, 3.4364423751831055, 3.6169521808624268, 3.797461986541748, 3.9779720306396484, 4.158482074737549, 4.338991641998291, 4.519501686096191, 4.700011730194092, 4.880521774291992, 5.061031341552734, 5.241541862487793, 5.422051906585693, 5.602561950683594, 5.783071517944336, 5.963581562042236, 6.144091606140137, 6.324601650238037, 6.5051116943359375, 6.68562126159668, 6.86613130569458, 7.0466413497924805, 7.227150917053223, 7.407660961151123, 7.588171005249023, 7.768681049346924, 7.949191093444824, 8.129700660705566]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 1.0, 5.0, 9.0, 8.0, 13.0, 21.0, 32.0, 25.0, 34.0, 35.0, 33.0, 51.0, 50.0, 62.0, 61.0, 70.0, 47.0, 56.0, 50.0, 60.0, 36.0, 48.0, 37.0, 33.0, 29.0, 30.0, 19.0, 13.0, 11.0, 8.0, 7.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.947227954864502, -2.8547418117523193, -2.7622554302215576, -2.669769287109375, -2.5772831439971924, -2.4847970008850098, -2.392310619354248, -2.2998244762420654, -2.207338333129883, -2.1148521900177, -2.0223658084869385, -1.9298796653747559, -1.8373935222625732, -1.744907259941101, -1.652420997619629, -1.5599348545074463, -1.4674485921859741, -1.374962329864502, -1.2824761867523193, -1.1899899244308472, -1.0975037813186646, -1.0050175189971924, -0.912531316280365, -0.8200451135635376, -0.7275589108467102, -0.6350727081298828, -0.5425865054130554, -0.45010027289390564, -0.35761407017707825, -0.26512786746025085, -0.17264163494110107, -0.08015543222427368, 0.012330770492553711, 0.1048169806599617, 0.1973031908273697, 0.2897894084453583, 0.38227561116218567, 0.47476181387901306, 0.5672480463981628, 0.6597342491149902, 0.7522204518318176, 0.844706654548645, 0.9371928572654724, 1.0296790599822998, 1.122165322303772, 1.2146514654159546, 1.3071377277374268, 1.3996238708496094, 1.4921101331710815, 1.5845963954925537, 1.6770825386047363, 1.7695688009262085, 1.8620549440383911, 1.9545412063598633, 2.047027349472046, 2.1395134925842285, 2.2319998741149902, 2.324486017227173, 2.4169723987579346, 2.509458541870117, 2.6019446849823, 2.6944308280944824, 2.786917209625244, 2.8794033527374268, 2.9718894958496094]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 6.0, 4.0, 9.0, 9.0, 16.0, 11.0, 26.0, 42.0, 44.0, 62.0, 94.0, 171.0, 429.0, 902.0, 2186.0, 6167.0, 23313.0, 103050.0, 620274.0, 232183.0, 42574.0, 11164.0, 3366.0, 1298.0, 566.0, 239.0, 117.0, 74.0, 49.0, 39.0, 23.0, 15.0, 12.0, 8.0, 6.0, 8.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.208984375, -2.145355224609375, -2.08172607421875, -2.018096923828125, -1.9544677734375, -1.890838623046875, -1.82720947265625, -1.763580322265625, -1.699951171875, -1.636322021484375, -1.57269287109375, -1.509063720703125, -1.4454345703125, -1.381805419921875, -1.31817626953125, -1.254547119140625, -1.19091796875, -1.127288818359375, -1.06365966796875, -1.000030517578125, -0.9364013671875, -0.872772216796875, -0.80914306640625, -0.745513916015625, -0.681884765625, -0.618255615234375, -0.55462646484375, -0.490997314453125, -0.4273681640625, -0.363739013671875, -0.30010986328125, -0.236480712890625, -0.1728515625, -0.109222412109375, -0.04559326171875, 0.018035888671875, 0.0816650390625, 0.145294189453125, 0.20892333984375, 0.272552490234375, 0.336181640625, 0.399810791015625, 0.46343994140625, 0.527069091796875, 0.5906982421875, 0.654327392578125, 0.71795654296875, 0.781585693359375, 0.84521484375, 0.908843994140625, 0.97247314453125, 1.036102294921875, 1.0997314453125, 1.163360595703125, 1.22698974609375, 1.290618896484375, 1.354248046875, 1.417877197265625, 1.48150634765625, 1.545135498046875, 1.6087646484375, 1.672393798828125, 1.73602294921875, 1.799652099609375, 1.86328125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 1.0, 2.0, 10.0, 12.0, 31.0, 46.0, 57.0, 65.0, 73.0, 66.0, 95.0, 100.0, 98.0, 90.0, 69.0, 57.0, 32.0, 29.0, 28.0, 14.0, 11.0, 8.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.748046875, -0.73114013671875, -0.7142333984375, -0.69732666015625, -0.680419921875, -0.66351318359375, -0.6466064453125, -0.62969970703125, -0.61279296875, -0.59588623046875, -0.5789794921875, -0.56207275390625, -0.545166015625, -0.52825927734375, -0.5113525390625, -0.49444580078125, -0.4775390625, -0.46063232421875, -0.4437255859375, -0.42681884765625, -0.409912109375, -0.39300537109375, -0.3760986328125, -0.35919189453125, -0.34228515625, -0.32537841796875, -0.3084716796875, -0.29156494140625, -0.274658203125, -0.25775146484375, -0.2408447265625, -0.22393798828125, -0.20703125, -0.19012451171875, -0.1732177734375, -0.15631103515625, -0.139404296875, -0.12249755859375, -0.1055908203125, -0.08868408203125, -0.07177734375, -0.05487060546875, -0.0379638671875, -0.02105712890625, -0.004150390625, 0.01275634765625, 0.0296630859375, 0.04656982421875, 0.0634765625, 0.08038330078125, 0.0972900390625, 0.11419677734375, 0.131103515625, 0.14801025390625, 0.1649169921875, 0.18182373046875, 0.19873046875, 0.21563720703125, 0.2325439453125, 0.24945068359375, 0.266357421875, 0.28326416015625, 0.3001708984375, 0.31707763671875, 0.333984375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 4.0, 1.0, 6.0, 4.0, 14.0, 8.0, 21.0, 27.0, 38.0, 60.0, 79.0, 99.0, 195.0, 286.0, 451.0, 783.0, 1396.0, 2670.0, 5758.0, 13439.0, 36128.0, 117413.0, 521079.0, 248490.0, 61800.0, 21377.0, 8691.0, 3762.0, 1878.0, 996.0, 559.0, 367.0, 222.0, 165.0, 93.0, 72.0, 42.0, 29.0, 16.0, 11.0, 10.0, 5.0, 5.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5654296875, -1.5145111083984375, -1.463592529296875, -1.4126739501953125, -1.36175537109375, -1.3108367919921875, -1.259918212890625, -1.2089996337890625, -1.1580810546875, -1.1071624755859375, -1.056243896484375, -1.0053253173828125, -0.95440673828125, -0.9034881591796875, -0.852569580078125, -0.8016510009765625, -0.750732421875, -0.6998138427734375, -0.648895263671875, -0.5979766845703125, -0.54705810546875, -0.4961395263671875, -0.445220947265625, -0.3943023681640625, -0.3433837890625, -0.2924652099609375, -0.241546630859375, -0.1906280517578125, -0.13970947265625, -0.0887908935546875, -0.037872314453125, 0.0130462646484375, 0.06396484375, 0.1148834228515625, 0.165802001953125, 0.2167205810546875, 0.26763916015625, 0.3185577392578125, 0.369476318359375, 0.4203948974609375, 0.4713134765625, 0.5222320556640625, 0.573150634765625, 0.6240692138671875, 0.67498779296875, 0.7259063720703125, 0.776824951171875, 0.8277435302734375, 0.878662109375, 0.9295806884765625, 0.980499267578125, 1.0314178466796875, 1.08233642578125, 1.1332550048828125, 1.184173583984375, 1.2350921630859375, 1.2860107421875, 1.3369293212890625, 1.387847900390625, 1.4387664794921875, 1.48968505859375, 1.5406036376953125, 1.591522216796875, 1.6424407958984375, 1.693359375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 10.0, 9.0, 18.0, 16.0, 17.0, 26.0, 27.0, 35.0, 39.0, 38.0, 41.0, 49.0, 54.0, 54.0, 54.0, 48.0, 52.0, 59.0, 46.0, 41.0, 46.0, 45.0, 36.0, 28.0, 26.0, 17.0, 13.0, 12.0, 10.0, 10.0, 1.0, 8.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.357421875, -2.288116455078125, -2.21881103515625, -2.149505615234375, -2.0802001953125, -2.010894775390625, -1.94158935546875, -1.872283935546875, -1.802978515625, -1.733673095703125, -1.66436767578125, -1.595062255859375, -1.5257568359375, -1.456451416015625, -1.38714599609375, -1.317840576171875, -1.24853515625, -1.179229736328125, -1.10992431640625, -1.040618896484375, -0.9713134765625, -0.902008056640625, -0.83270263671875, -0.763397216796875, -0.694091796875, -0.624786376953125, -0.55548095703125, -0.486175537109375, -0.4168701171875, -0.347564697265625, -0.27825927734375, -0.208953857421875, -0.1396484375, -0.070343017578125, -0.00103759765625, 0.068267822265625, 0.1375732421875, 0.206878662109375, 0.27618408203125, 0.345489501953125, 0.414794921875, 0.484100341796875, 0.55340576171875, 0.622711181640625, 0.6920166015625, 0.761322021484375, 0.83062744140625, 0.899932861328125, 0.96923828125, 1.038543701171875, 1.10784912109375, 1.177154541015625, 1.2464599609375, 1.315765380859375, 1.38507080078125, 1.454376220703125, 1.523681640625, 1.592987060546875, 1.66229248046875, 1.731597900390625, 1.8009033203125, 1.870208740234375, 1.93951416015625, 2.008819580078125, 2.078125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 7.0, 7.0, 8.0, 12.0, 18.0, 20.0, 43.0, 65.0, 96.0, 134.0, 256.0, 429.0, 812.0, 1680.0, 4412.0, 18028.0, 412152.0, 580704.0, 21186.0, 4701.0, 1813.0, 795.0, 457.0, 294.0, 161.0, 92.0, 58.0, 41.0, 27.0, 17.0, 16.0, 6.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4599609375, -1.4096832275390625, -1.359405517578125, -1.3091278076171875, -1.25885009765625, -1.2085723876953125, -1.158294677734375, -1.1080169677734375, -1.0577392578125, -1.0074615478515625, -0.957183837890625, -0.9069061279296875, -0.85662841796875, -0.8063507080078125, -0.756072998046875, -0.7057952880859375, -0.655517578125, -0.6052398681640625, -0.554962158203125, -0.5046844482421875, -0.45440673828125, -0.4041290283203125, -0.353851318359375, -0.3035736083984375, -0.2532958984375, -0.2030181884765625, -0.152740478515625, -0.1024627685546875, -0.05218505859375, -0.0019073486328125, 0.048370361328125, 0.0986480712890625, 0.14892578125, 0.1992034912109375, 0.249481201171875, 0.2997589111328125, 0.35003662109375, 0.4003143310546875, 0.450592041015625, 0.5008697509765625, 0.5511474609375, 0.6014251708984375, 0.651702880859375, 0.7019805908203125, 0.75225830078125, 0.8025360107421875, 0.852813720703125, 0.9030914306640625, 0.953369140625, 1.0036468505859375, 1.053924560546875, 1.1042022705078125, 1.15447998046875, 1.2047576904296875, 1.255035400390625, 1.3053131103515625, 1.3555908203125, 1.4058685302734375, 1.456146240234375, 1.5064239501953125, 1.55670166015625, 1.6069793701171875, 1.657257080078125, 1.7075347900390625, 1.7578125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 8.0, 9.0, 17.0, 21.0, 50.0, 102.0, 162.0, 204.0, 171.0, 116.0, 54.0, 33.0, 14.0, 11.0, 8.0, 6.0, 5.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015807151794433594, -0.00015350431203842163, -0.00014893710613250732, -0.00014436990022659302, -0.0001398026943206787, -0.0001352354884147644, -0.0001306682825088501, -0.0001261010766029358, -0.00012153387069702148, -0.00011696666479110718, -0.00011239945888519287, -0.00010783225297927856, -0.00010326504707336426, -9.869784116744995e-05, -9.413063526153564e-05, -8.956342935562134e-05, -8.499622344970703e-05, -8.042901754379272e-05, -7.586181163787842e-05, -7.129460573196411e-05, -6.67273998260498e-05, -6.21601939201355e-05, -5.759298801422119e-05, -5.3025782108306885e-05, -4.845857620239258e-05, -4.389137029647827e-05, -3.9324164390563965e-05, -3.475695848464966e-05, -3.018975257873535e-05, -2.5622546672821045e-05, -2.1055340766906738e-05, -1.648813486099243e-05, -1.1920928955078125e-05, -7.353723049163818e-06, -2.7865171432495117e-06, 1.780688762664795e-06, 6.3478946685791016e-06, 1.0915100574493408e-05, 1.5482306480407715e-05, 2.004951238632202e-05, 2.4616718292236328e-05, 2.9183924198150635e-05, 3.375113010406494e-05, 3.831833600997925e-05, 4.2885541915893555e-05, 4.745274782180786e-05, 5.201995372772217e-05, 5.6587159633636475e-05, 6.115436553955078e-05, 6.572157144546509e-05, 7.02887773513794e-05, 7.48559832572937e-05, 7.942318916320801e-05, 8.399039506912231e-05, 8.855760097503662e-05, 9.312480688095093e-05, 9.769201278686523e-05, 0.00010225921869277954, 0.00010682642459869385, 0.00011139363050460815, 0.00011596083641052246, 0.00012052804231643677, 0.00012509524822235107, 0.00012966245412826538, 0.0001342296600341797]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 2.0, 5.0, 6.0, 10.0, 14.0, 23.0, 34.0, 61.0, 85.0, 130.0, 218.0, 368.0, 700.0, 1477.0, 3616.0, 11393.0, 83809.0, 848821.0, 80007.0, 11170.0, 3465.0, 1467.0, 692.0, 371.0, 213.0, 136.0, 89.0, 58.0, 25.0, 32.0, 14.0, 13.0, 12.0, 5.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.3203125, -1.283111572265625, -1.24591064453125, -1.208709716796875, -1.1715087890625, -1.134307861328125, -1.09710693359375, -1.059906005859375, -1.022705078125, -0.985504150390625, -0.94830322265625, -0.911102294921875, -0.8739013671875, -0.836700439453125, -0.79949951171875, -0.762298583984375, -0.72509765625, -0.687896728515625, -0.65069580078125, -0.613494873046875, -0.5762939453125, -0.539093017578125, -0.50189208984375, -0.464691162109375, -0.427490234375, -0.390289306640625, -0.35308837890625, -0.315887451171875, -0.2786865234375, -0.241485595703125, -0.20428466796875, -0.167083740234375, -0.1298828125, -0.092681884765625, -0.05548095703125, -0.018280029296875, 0.0189208984375, 0.056121826171875, 0.09332275390625, 0.130523681640625, 0.167724609375, 0.204925537109375, 0.24212646484375, 0.279327392578125, 0.3165283203125, 0.353729248046875, 0.39093017578125, 0.428131103515625, 0.46533203125, 0.502532958984375, 0.53973388671875, 0.576934814453125, 0.6141357421875, 0.651336669921875, 0.68853759765625, 0.725738525390625, 0.762939453125, 0.800140380859375, 0.83734130859375, 0.874542236328125, 0.9117431640625, 0.948944091796875, 0.98614501953125, 1.023345947265625, 1.060546875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 1.0, 3.0, 4.0, 10.0, 17.0, 26.0, 43.0, 66.0, 107.0, 219.0, 205.0, 119.0, 72.0, 35.0, 24.0, 12.0, 9.0, 4.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.296875, -1.25042724609375, -1.2039794921875, -1.15753173828125, -1.111083984375, -1.06463623046875, -1.0181884765625, -0.97174072265625, -0.92529296875, -0.87884521484375, -0.8323974609375, -0.78594970703125, -0.739501953125, -0.69305419921875, -0.6466064453125, -0.60015869140625, -0.5537109375, -0.50726318359375, -0.4608154296875, -0.41436767578125, -0.367919921875, -0.32147216796875, -0.2750244140625, -0.22857666015625, -0.18212890625, -0.13568115234375, -0.0892333984375, -0.04278564453125, 0.003662109375, 0.05010986328125, 0.0965576171875, 0.14300537109375, 0.189453125, 0.23590087890625, 0.2823486328125, 0.32879638671875, 0.375244140625, 0.42169189453125, 0.4681396484375, 0.51458740234375, 0.56103515625, 0.60748291015625, 0.6539306640625, 0.70037841796875, 0.746826171875, 0.79327392578125, 0.8397216796875, 0.88616943359375, 0.9326171875, 0.97906494140625, 1.0255126953125, 1.07196044921875, 1.118408203125, 1.16485595703125, 1.2113037109375, 1.25775146484375, 1.30419921875, 1.35064697265625, 1.3970947265625, 1.44354248046875, 1.489990234375, 1.53643798828125, 1.5828857421875, 1.62933349609375, 1.67578125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 1.0, 3.0, 11.0, 16.0, 26.0, 52.0, 124.0, 225.0, 295.0, 138.0, 51.0, 33.0, 21.0, 5.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-42.71803283691406, -41.811527252197266, -40.90502166748047, -39.99851608276367, -39.092010498046875, -38.18550491333008, -37.27899932861328, -36.372493743896484, -35.46598815917969, -34.55948257446289, -33.652976989746094, -32.7464714050293, -31.8399658203125, -30.933460235595703, -30.026954650878906, -29.12044906616211, -28.213943481445312, -27.307437896728516, -26.40093231201172, -25.494426727294922, -24.587921142578125, -23.681415557861328, -22.77490997314453, -21.868404388427734, -20.96190071105957, -20.055395126342773, -19.148889541625977, -18.24238395690918, -17.335878372192383, -16.429372787475586, -15.522867202758789, -14.616361618041992, -13.709855079650879, -12.803349494934082, -11.896843910217285, -10.990338325500488, -10.083832740783691, -9.177328109741211, -8.270822525024414, -7.364316463470459, -6.457810878753662, -5.551305294036865, -4.644799709320068, -3.7382943630218506, -2.8317887783050537, -1.925283432006836, -1.018777847290039, -0.11227226257324219, 0.7942333221435547, 1.7007389068603516, 2.6072444915771484, 3.513749837875366, 4.420255661010742, 5.326760768890381, 6.233266353607178, 7.139771938323975, 8.04627799987793, 8.952783584594727, 9.859289169311523, 10.76579475402832, 11.672300338745117, 12.578805923461914, 13.485311508178711, 14.391817092895508, 15.298321723937988]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 0.0, 0.0, 3.0, 3.0, 12.0, 12.0, 7.0, 10.0, 12.0, 21.0, 13.0, 26.0, 21.0, 29.0, 28.0, 26.0, 30.0, 59.0, 48.0, 47.0, 48.0, 51.0, 59.0, 52.0, 55.0, 45.0, 37.0, 31.0, 38.0, 38.0, 20.0, 26.0, 15.0, 17.0, 17.0, 6.0, 12.0, 4.0, 3.0, 8.0, 3.0, 7.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.458839416503906, -14.010566711425781, -13.562294006347656, -13.114022254943848, -12.665749549865723, -12.217476844787598, -11.769204139709473, -11.320932388305664, -10.872659683227539, -10.424386978149414, -9.976114273071289, -9.52784252166748, -9.079569816589355, -8.63129711151123, -8.183024406433105, -7.734752178192139, -7.286479473114014, -6.838206768035889, -6.389934539794922, -5.941661834716797, -5.49338960647583, -5.045116901397705, -4.596844673156738, -4.148571968078613, -3.7002995014190674, -3.2520270347595215, -2.8037545680999756, -2.3554821014404297, -1.9072095155715942, -1.4589369297027588, -1.010664463043213, -0.562391996383667, -0.1141195297241211, 0.3341529667377472, 0.7824254631996155, 1.2306979894638062, 1.678970456123352, 2.1272430419921875, 2.5755155086517334, 3.0237879753112793, 3.472060441970825, 3.920332908630371, 4.368605613708496, 4.816877841949463, 5.265150547027588, 5.713422775268555, 6.16169548034668, 6.609968185424805, 7.0582404136657715, 7.5065131187438965, 7.954785346984863, 8.403058052062988, 8.851330757141113, 9.299602508544922, 9.747875213623047, 10.196147918701172, 10.644420623779297, 11.092693328857422, 11.540966033935547, 11.989237785339355, 12.43751049041748, 12.885783195495605, 13.33405590057373, 13.782327651977539, 14.230600357055664]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 5.0, 1.0, 3.0, 3.0, 14.0, 14.0, 21.0, 26.0, 28.0, 69.0, 93.0, 148.0, 251.0, 389.0, 635.0, 1131.0, 2186.0, 4513.0, 20267.0, 4144184.0, 12124.0, 3813.0, 1863.0, 1048.0, 554.0, 328.0, 213.0, 131.0, 73.0, 63.0, 33.0, 20.0, 16.0, 6.0, 12.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.703125, -4.5894775390625, -4.475830078125, -4.3621826171875, -4.24853515625, -4.1348876953125, -4.021240234375, -3.9075927734375, -3.7939453125, -3.6802978515625, -3.566650390625, -3.4530029296875, -3.33935546875, -3.2257080078125, -3.112060546875, -2.9984130859375, -2.884765625, -2.7711181640625, -2.657470703125, -2.5438232421875, -2.43017578125, -2.3165283203125, -2.202880859375, -2.0892333984375, -1.9755859375, -1.8619384765625, -1.748291015625, -1.6346435546875, -1.52099609375, -1.4073486328125, -1.293701171875, -1.1800537109375, -1.06640625, -0.9527587890625, -0.839111328125, -0.7254638671875, -0.61181640625, -0.4981689453125, -0.384521484375, -0.2708740234375, -0.1572265625, -0.0435791015625, 0.070068359375, 0.1837158203125, 0.29736328125, 0.4110107421875, 0.524658203125, 0.6383056640625, 0.751953125, 0.8656005859375, 0.979248046875, 1.0928955078125, 1.20654296875, 1.3201904296875, 1.433837890625, 1.5474853515625, 1.6611328125, 1.7747802734375, 1.888427734375, 2.0020751953125, 2.11572265625, 2.2293701171875, 2.343017578125, 2.4566650390625, 2.5703125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 6.0, 2.0, 4.0, 8.0, 14.0, 15.0, 16.0, 22.0, 30.0, 45.0, 42.0, 62.0, 68.0, 60.0, 58.0, 72.0, 79.0, 81.0, 74.0, 57.0, 46.0, 37.0, 25.0, 24.0, 14.0, 4.0, 15.0, 10.0, 11.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.8076171875, -0.7876091003417969, -0.7676010131835938, -0.7475929260253906, -0.7275848388671875, -0.7075767517089844, -0.6875686645507812, -0.6675605773925781, -0.647552490234375, -0.6275444030761719, -0.6075363159179688, -0.5875282287597656, -0.5675201416015625, -0.5475120544433594, -0.5275039672851562, -0.5074958801269531, -0.48748779296875, -0.4674797058105469, -0.44747161865234375, -0.4274635314941406, -0.4074554443359375, -0.3874473571777344, -0.36743927001953125, -0.3474311828613281, -0.327423095703125, -0.3074150085449219, -0.28740692138671875, -0.2673988342285156, -0.2473907470703125, -0.22738265991210938, -0.20737457275390625, -0.18736648559570312, -0.1673583984375, -0.14735031127929688, -0.12734222412109375, -0.10733413696289062, -0.0873260498046875, -0.06731796264648438, -0.04730987548828125, -0.027301788330078125, -0.007293701171875, 0.012714385986328125, 0.03272247314453125, 0.052730560302734375, 0.0727386474609375, 0.09274673461914062, 0.11275482177734375, 0.13276290893554688, 0.15277099609375, 0.17277908325195312, 0.19278717041015625, 0.21279525756835938, 0.2328033447265625, 0.2528114318847656, 0.27281951904296875, 0.2928276062011719, 0.312835693359375, 0.3328437805175781, 0.35285186767578125, 0.3728599548339844, 0.3928680419921875, 0.4128761291503906, 0.43288421630859375, 0.4528923034667969, 0.472900390625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 7.0, 6.0, 11.0, 9.0, 18.0, 13.0, 27.0, 24.0, 41.0, 62.0, 84.0, 91.0, 145.0, 201.0, 282.0, 391.0, 609.0, 897.0, 1374.0, 2649.0, 5987.0, 19134.0, 4101665.0, 43373.0, 8800.0, 3402.0, 1735.0, 1022.0, 661.0, 446.0, 327.0, 199.0, 149.0, 125.0, 77.0, 65.0, 54.0, 35.0, 22.0, 21.0, 11.0, 14.0, 7.0, 4.0, 3.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.021484375, -2.926116943359375, -2.83074951171875, -2.735382080078125, -2.6400146484375, -2.544647216796875, -2.44927978515625, -2.353912353515625, -2.258544921875, -2.163177490234375, -2.06781005859375, -1.972442626953125, -1.8770751953125, -1.781707763671875, -1.68634033203125, -1.590972900390625, -1.49560546875, -1.400238037109375, -1.30487060546875, -1.209503173828125, -1.1141357421875, -1.018768310546875, -0.92340087890625, -0.828033447265625, -0.732666015625, -0.637298583984375, -0.54193115234375, -0.446563720703125, -0.3511962890625, -0.255828857421875, -0.16046142578125, -0.065093994140625, 0.0302734375, 0.125640869140625, 0.22100830078125, 0.316375732421875, 0.4117431640625, 0.507110595703125, 0.60247802734375, 0.697845458984375, 0.793212890625, 0.888580322265625, 0.98394775390625, 1.079315185546875, 1.1746826171875, 1.270050048828125, 1.36541748046875, 1.460784912109375, 1.55615234375, 1.651519775390625, 1.74688720703125, 1.842254638671875, 1.9376220703125, 2.032989501953125, 2.12835693359375, 2.223724365234375, 2.319091796875, 2.414459228515625, 2.50982666015625, 2.605194091796875, 2.7005615234375, 2.795928955078125, 2.89129638671875, 2.986663818359375, 3.08203125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 8.0, 5.0, 9.0, 26.0, 100.0, 3799.0, 58.0, 20.0, 16.0, 5.0, 3.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6826171875, -0.6615142822265625, -0.640411376953125, -0.6193084716796875, -0.59820556640625, -0.5771026611328125, -0.555999755859375, -0.5348968505859375, -0.5137939453125, -0.4926910400390625, -0.471588134765625, -0.4504852294921875, -0.42938232421875, -0.4082794189453125, -0.387176513671875, -0.3660736083984375, -0.344970703125, -0.3238677978515625, -0.302764892578125, -0.2816619873046875, -0.26055908203125, -0.2394561767578125, -0.218353271484375, -0.1972503662109375, -0.1761474609375, -0.1550445556640625, -0.133941650390625, -0.1128387451171875, -0.09173583984375, -0.0706329345703125, -0.049530029296875, -0.0284271240234375, -0.00732421875, 0.0137786865234375, 0.034881591796875, 0.0559844970703125, 0.07708740234375, 0.0981903076171875, 0.119293212890625, 0.1403961181640625, 0.1614990234375, 0.1826019287109375, 0.203704833984375, 0.2248077392578125, 0.24591064453125, 0.2670135498046875, 0.288116455078125, 0.3092193603515625, 0.330322265625, 0.3514251708984375, 0.372528076171875, 0.3936309814453125, 0.41473388671875, 0.4358367919921875, 0.456939697265625, 0.4780426025390625, 0.4991455078125, 0.5202484130859375, 0.541351318359375, 0.5624542236328125, 0.58355712890625, 0.6046600341796875, 0.625762939453125, 0.6468658447265625, 0.66796875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 11.0, 9.0, 34.0, 69.0, 108.0, 244.0, 277.0, 154.0, 55.0, 29.0, 15.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.771570205688477, -5.6543707847595215, -5.537170886993408, -5.419971466064453, -5.30277156829834, -5.185572147369385, -5.0683722496032715, -4.951172828674316, -4.833972930908203, -4.716773509979248, -4.599573612213135, -4.48237419128418, -4.365174293518066, -4.247974872589111, -4.130774974822998, -4.013575553894043, -3.896376132965088, -3.7791764736175537, -3.6619768142700195, -3.5447771549224854, -3.427577495574951, -3.310378074645996, -3.193178415298462, -3.0759787559509277, -2.9587790966033936, -2.8415794372558594, -2.724379777908325, -2.607180118560791, -2.489980697631836, -2.3727807998657227, -2.2555813789367676, -2.1383817195892334, -2.0211822986602783, -1.9039826393127441, -1.78678297996521, -1.6695834398269653, -1.5523837804794312, -1.435184121131897, -1.3179845809936523, -1.2007849216461182, -1.083585262298584, -0.9663856029510498, -0.8491860032081604, -0.731986403465271, -0.6147867441177368, -0.49758708477020264, -0.38038748502731323, -0.26318788528442383, -0.14598822593688965, -0.028788596391677856, 0.08841103315353394, 0.20561066269874573, 0.3228102922439575, 0.4400099515914917, 0.5572095513343811, 0.6744091510772705, 0.7916088104248047, 0.9088084697723389, 1.026008129119873, 1.1432076692581177, 1.2604073286056519, 1.377606987953186, 1.4948065280914307, 1.6120061874389648, 1.729205846786499]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 4.0, 3.0, 3.0, 6.0, 4.0, 13.0, 13.0, 9.0, 17.0, 23.0, 26.0, 33.0, 30.0, 39.0, 33.0, 47.0, 43.0, 43.0, 46.0, 51.0, 36.0, 44.0, 52.0, 43.0, 37.0, 47.0, 29.0, 32.0, 32.0, 36.0, 24.0, 20.0, 19.0, 18.0, 9.0, 12.0, 10.0, 10.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0555193424224854, -1.0179657936096191, -0.9804121255874634, -0.9428585767745972, -0.9053049683570862, -0.8677513599395752, -0.8301977515220642, -0.7926441431045532, -0.755090594291687, -0.717536985874176, -0.679983377456665, -0.6424298286437988, -0.6048762202262878, -0.5673226118087769, -0.5297690033912659, -0.49221542477607727, -0.4546617865562439, -0.4171081781387329, -0.3795545995235443, -0.3420009911060333, -0.3044474124908447, -0.26689380407333374, -0.22934019565582275, -0.19178661704063416, -0.15423300862312317, -0.11667941510677338, -0.07912581413984299, -0.0415722131729126, -0.004018619656562805, 0.03353497385978699, 0.07108858227729797, 0.10864216089248657, 0.14619576930999756, 0.18374936282634735, 0.22130295634269714, 0.25885656476020813, 0.29641014337539673, 0.3339637517929077, 0.3715173602104187, 0.4090709388256073, 0.4466245472431183, 0.4841781556606293, 0.5217317342758179, 0.5592853426933289, 0.5968389511108398, 0.634392499923706, 0.6719461679458618, 0.709499716758728, 0.747053325176239, 0.78460693359375, 0.822160542011261, 0.859714150428772, 0.8972676992416382, 0.9348213076591492, 0.9723749160766602, 1.0099284648895264, 1.0474821329116821, 1.0850356817245483, 1.122589349746704, 1.1601428985595703, 1.197696566581726, 1.2352501153945923, 1.272803783416748, 1.3103573322296143, 1.3479108810424805]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 9.0, 1.0, 4.0, 8.0, 7.0, 18.0, 13.0, 28.0, 48.0, 61.0, 94.0, 140.0, 225.0, 352.0, 594.0, 1143.0, 2235.0, 4557.0, 9987.0, 25379.0, 76105.0, 303199.0, 449347.0, 114451.0, 35269.0, 13441.0, 5661.0, 2806.0, 1446.0, 784.0, 431.0, 245.0, 162.0, 114.0, 63.0, 48.0, 17.0, 26.0, 11.0, 9.0, 10.0, 5.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.017578125, -1.95068359375, -1.8837890625, -1.81689453125, -1.75, -1.68310546875, -1.6162109375, -1.54931640625, -1.482421875, -1.41552734375, -1.3486328125, -1.28173828125, -1.21484375, -1.14794921875, -1.0810546875, -1.01416015625, -0.947265625, -0.88037109375, -0.8134765625, -0.74658203125, -0.6796875, -0.61279296875, -0.5458984375, -0.47900390625, -0.412109375, -0.34521484375, -0.2783203125, -0.21142578125, -0.14453125, -0.07763671875, -0.0107421875, 0.05615234375, 0.123046875, 0.18994140625, 0.2568359375, 0.32373046875, 0.390625, 0.45751953125, 0.5244140625, 0.59130859375, 0.658203125, 0.72509765625, 0.7919921875, 0.85888671875, 0.92578125, 0.99267578125, 1.0595703125, 1.12646484375, 1.193359375, 1.26025390625, 1.3271484375, 1.39404296875, 1.4609375, 1.52783203125, 1.5947265625, 1.66162109375, 1.728515625, 1.79541015625, 1.8623046875, 1.92919921875, 1.99609375, 2.06298828125, 2.1298828125, 2.19677734375, 2.263671875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 7.0, 1.0, 11.0, 12.0, 19.0, 18.0, 27.0, 34.0, 47.0, 53.0, 62.0, 48.0, 60.0, 62.0, 96.0, 57.0, 72.0, 64.0, 62.0, 40.0, 37.0, 25.0, 22.0, 17.0, 12.0, 12.0, 6.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.794921875, -0.7746047973632812, -0.7542877197265625, -0.7339706420898438, -0.713653564453125, -0.6933364868164062, -0.6730194091796875, -0.6527023315429688, -0.63238525390625, -0.6120681762695312, -0.5917510986328125, -0.5714340209960938, -0.551116943359375, -0.5307998657226562, -0.5104827880859375, -0.49016571044921875, -0.4698486328125, -0.44953155517578125, -0.4292144775390625, -0.40889739990234375, -0.388580322265625, -0.36826324462890625, -0.3479461669921875, -0.32762908935546875, -0.30731201171875, -0.28699493408203125, -0.2666778564453125, -0.24636077880859375, -0.226043701171875, -0.20572662353515625, -0.1854095458984375, -0.16509246826171875, -0.144775390625, -0.12445831298828125, -0.1041412353515625, -0.08382415771484375, -0.063507080078125, -0.04319000244140625, -0.0228729248046875, -0.00255584716796875, 0.01776123046875, 0.03807830810546875, 0.0583953857421875, 0.07871246337890625, 0.099029541015625, 0.11934661865234375, 0.1396636962890625, 0.15998077392578125, 0.1802978515625, 0.20061492919921875, 0.2209320068359375, 0.24124908447265625, 0.261566162109375, 0.28188323974609375, 0.3022003173828125, 0.32251739501953125, 0.34283447265625, 0.36315155029296875, 0.3834686279296875, 0.40378570556640625, 0.424102783203125, 0.44441986083984375, 0.4647369384765625, 0.48505401611328125, 0.50537109375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 6.0, 16.0, 17.0, 27.0, 36.0, 85.0, 98.0, 149.0, 294.0, 523.0, 953.0, 2032.0, 5184.0, 15470.0, 66025.0, 583324.0, 312444.0, 42767.0, 11543.0, 4028.0, 1659.0, 835.0, 409.0, 231.0, 131.0, 73.0, 60.0, 36.0, 36.0, 21.0, 13.0, 7.0, 12.0, 4.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.841796875, -3.72491455078125, -3.6080322265625, -3.49114990234375, -3.374267578125, -3.25738525390625, -3.1405029296875, -3.02362060546875, -2.90673828125, -2.78985595703125, -2.6729736328125, -2.55609130859375, -2.439208984375, -2.32232666015625, -2.2054443359375, -2.08856201171875, -1.9716796875, -1.85479736328125, -1.7379150390625, -1.62103271484375, -1.504150390625, -1.38726806640625, -1.2703857421875, -1.15350341796875, -1.03662109375, -0.91973876953125, -0.8028564453125, -0.68597412109375, -0.569091796875, -0.45220947265625, -0.3353271484375, -0.21844482421875, -0.1015625, 0.01531982421875, 0.1322021484375, 0.24908447265625, 0.365966796875, 0.48284912109375, 0.5997314453125, 0.71661376953125, 0.83349609375, 0.95037841796875, 1.0672607421875, 1.18414306640625, 1.301025390625, 1.41790771484375, 1.5347900390625, 1.65167236328125, 1.7685546875, 1.88543701171875, 2.0023193359375, 2.11920166015625, 2.236083984375, 2.35296630859375, 2.4698486328125, 2.58673095703125, 2.70361328125, 2.82049560546875, 2.9373779296875, 3.05426025390625, 3.171142578125, 3.28802490234375, 3.4049072265625, 3.52178955078125, 3.638671875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 7.0, 4.0, 7.0, 9.0, 5.0, 8.0, 12.0, 19.0, 20.0, 27.0, 29.0, 43.0, 41.0, 65.0, 52.0, 62.0, 74.0, 63.0, 57.0, 65.0, 62.0, 48.0, 48.0, 42.0, 34.0, 21.0, 24.0, 17.0, 10.0, 11.0, 6.0, 5.0, 3.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.412109375, -3.266265869140625, -3.12042236328125, -2.974578857421875, -2.8287353515625, -2.682891845703125, -2.53704833984375, -2.391204833984375, -2.245361328125, -2.099517822265625, -1.95367431640625, -1.807830810546875, -1.6619873046875, -1.516143798828125, -1.37030029296875, -1.224456787109375, -1.07861328125, -0.932769775390625, -0.78692626953125, -0.641082763671875, -0.4952392578125, -0.349395751953125, -0.20355224609375, -0.057708740234375, 0.088134765625, 0.233978271484375, 0.37982177734375, 0.525665283203125, 0.6715087890625, 0.817352294921875, 0.96319580078125, 1.109039306640625, 1.2548828125, 1.400726318359375, 1.54656982421875, 1.692413330078125, 1.8382568359375, 1.984100341796875, 2.12994384765625, 2.275787353515625, 2.421630859375, 2.567474365234375, 2.71331787109375, 2.859161376953125, 3.0050048828125, 3.150848388671875, 3.29669189453125, 3.442535400390625, 3.58837890625, 3.734222412109375, 3.88006591796875, 4.025909423828125, 4.1717529296875, 4.317596435546875, 4.46343994140625, 4.609283447265625, 4.755126953125, 4.900970458984375, 5.04681396484375, 5.192657470703125, 5.3385009765625, 5.484344482421875, 5.63018798828125, 5.776031494140625, 5.921875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 7.0, 8.0, 7.0, 10.0, 24.0, 40.0, 52.0, 72.0, 107.0, 188.0, 290.0, 488.0, 979.0, 2019.0, 5374.0, 21817.0, 297703.0, 675404.0, 32202.0, 6757.0, 2428.0, 1106.0, 587.0, 335.0, 197.0, 139.0, 52.0, 53.0, 31.0, 28.0, 13.0, 11.0, 10.0, 10.0, 6.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.712890625, -2.6397705078125, -2.566650390625, -2.4935302734375, -2.42041015625, -2.3472900390625, -2.274169921875, -2.2010498046875, -2.1279296875, -2.0548095703125, -1.981689453125, -1.9085693359375, -1.83544921875, -1.7623291015625, -1.689208984375, -1.6160888671875, -1.54296875, -1.4698486328125, -1.396728515625, -1.3236083984375, -1.25048828125, -1.1773681640625, -1.104248046875, -1.0311279296875, -0.9580078125, -0.8848876953125, -0.811767578125, -0.7386474609375, -0.66552734375, -0.5924072265625, -0.519287109375, -0.4461669921875, -0.373046875, -0.2999267578125, -0.226806640625, -0.1536865234375, -0.08056640625, -0.0074462890625, 0.065673828125, 0.1387939453125, 0.2119140625, 0.2850341796875, 0.358154296875, 0.4312744140625, 0.50439453125, 0.5775146484375, 0.650634765625, 0.7237548828125, 0.796875, 0.8699951171875, 0.943115234375, 1.0162353515625, 1.08935546875, 1.1624755859375, 1.235595703125, 1.3087158203125, 1.3818359375, 1.4549560546875, 1.528076171875, 1.6011962890625, 1.67431640625, 1.7474365234375, 1.820556640625, 1.8936767578125, 1.966796875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 7.0, 11.0, 15.0, 37.0, 102.0, 219.0, 321.0, 163.0, 64.0, 29.0, 19.0, 9.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00047588348388671875, -0.00046237558126449585, -0.00044886767864227295, -0.00043535977602005005, -0.00042185187339782715, -0.00040834397077560425, -0.00039483606815338135, -0.00038132816553115845, -0.00036782026290893555, -0.00035431236028671265, -0.00034080445766448975, -0.00032729655504226685, -0.00031378865242004395, -0.00030028074979782104, -0.00028677284717559814, -0.00027326494455337524, -0.00025975704193115234, -0.00024624913930892944, -0.00023274123668670654, -0.00021923333406448364, -0.00020572543144226074, -0.00019221752882003784, -0.00017870962619781494, -0.00016520172357559204, -0.00015169382095336914, -0.00013818591833114624, -0.00012467801570892334, -0.00011117011308670044, -9.766221046447754e-05, -8.415430784225464e-05, -7.064640522003174e-05, -5.713850259780884e-05, -4.363059997558594e-05, -3.0122697353363037e-05, -1.6614794731140137e-05, -3.1068921089172363e-06, 1.0401010513305664e-05, 2.3908913135528564e-05, 3.7416815757751465e-05, 5.0924718379974365e-05, 6.443262100219727e-05, 7.794052362442017e-05, 9.144842624664307e-05, 0.00010495632886886597, 0.00011846423149108887, 0.00013197213411331177, 0.00014548003673553467, 0.00015898793935775757, 0.00017249584197998047, 0.00018600374460220337, 0.00019951164722442627, 0.00021301954984664917, 0.00022652745246887207, 0.00024003535509109497, 0.00025354325771331787, 0.00026705116033554077, 0.00028055906295776367, 0.00029406696557998657, 0.00030757486820220947, 0.0003210827708244324, 0.0003345906734466553, 0.0003480985760688782, 0.0003616064786911011, 0.000375114381313324, 0.0003886222839355469]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 1.0, 5.0, 12.0, 8.0, 12.0, 16.0, 29.0, 41.0, 41.0, 86.0, 115.0, 194.0, 315.0, 596.0, 1175.0, 2564.0, 6909.0, 26923.0, 236422.0, 701800.0, 53513.0, 10737.0, 3611.0, 1571.0, 750.0, 430.0, 239.0, 164.0, 89.0, 54.0, 34.0, 28.0, 18.0, 9.0, 8.0, 12.0, 7.0, 2.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3408203125, -1.2932586669921875, -1.245697021484375, -1.1981353759765625, -1.15057373046875, -1.1030120849609375, -1.055450439453125, -1.0078887939453125, -0.9603271484375, -0.9127655029296875, -0.865203857421875, -0.8176422119140625, -0.77008056640625, -0.7225189208984375, -0.674957275390625, -0.6273956298828125, -0.579833984375, -0.5322723388671875, -0.484710693359375, -0.4371490478515625, -0.38958740234375, -0.3420257568359375, -0.294464111328125, -0.2469024658203125, -0.1993408203125, -0.1517791748046875, -0.104217529296875, -0.0566558837890625, -0.00909423828125, 0.0384674072265625, 0.086029052734375, 0.1335906982421875, 0.18115234375, 0.2287139892578125, 0.276275634765625, 0.3238372802734375, 0.37139892578125, 0.4189605712890625, 0.466522216796875, 0.5140838623046875, 0.5616455078125, 0.6092071533203125, 0.656768798828125, 0.7043304443359375, 0.75189208984375, 0.7994537353515625, 0.847015380859375, 0.8945770263671875, 0.942138671875, 0.9897003173828125, 1.037261962890625, 1.0848236083984375, 1.13238525390625, 1.1799468994140625, 1.227508544921875, 1.2750701904296875, 1.3226318359375, 1.3701934814453125, 1.417755126953125, 1.4653167724609375, 1.51287841796875, 1.5604400634765625, 1.608001708984375, 1.6555633544921875, 1.703125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 5.0, 1.0, 2.0, 2.0, 6.0, 5.0, 7.0, 14.0, 13.0, 24.0, 27.0, 38.0, 50.0, 51.0, 103.0, 168.0, 121.0, 98.0, 64.0, 38.0, 35.0, 27.0, 30.0, 19.0, 15.0, 8.0, 9.0, 6.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5205078125, -1.4639129638671875, -1.407318115234375, -1.3507232666015625, -1.29412841796875, -1.2375335693359375, -1.180938720703125, -1.1243438720703125, -1.0677490234375, -1.0111541748046875, -0.954559326171875, -0.8979644775390625, -0.84136962890625, -0.7847747802734375, -0.728179931640625, -0.6715850830078125, -0.614990234375, -0.5583953857421875, -0.501800537109375, -0.4452056884765625, -0.38861083984375, -0.3320159912109375, -0.275421142578125, -0.2188262939453125, -0.1622314453125, -0.1056365966796875, -0.049041748046875, 0.0075531005859375, 0.06414794921875, 0.1207427978515625, 0.177337646484375, 0.2339324951171875, 0.29052734375, 0.3471221923828125, 0.403717041015625, 0.4603118896484375, 0.51690673828125, 0.5735015869140625, 0.630096435546875, 0.6866912841796875, 0.7432861328125, 0.7998809814453125, 0.856475830078125, 0.9130706787109375, 0.96966552734375, 1.0262603759765625, 1.082855224609375, 1.1394500732421875, 1.196044921875, 1.2526397705078125, 1.309234619140625, 1.3658294677734375, 1.42242431640625, 1.4790191650390625, 1.535614013671875, 1.5922088623046875, 1.6488037109375, 1.7053985595703125, 1.761993408203125, 1.8185882568359375, 1.87518310546875, 1.9317779541015625, 1.988372802734375, 2.0449676513671875, 2.1015625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 15.0, 17.0, 23.0, 45.0, 58.0, 103.0, 155.0, 196.0, 137.0, 114.0, 55.0, 26.0, 20.0, 14.0, 9.0, 1.0, 4.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.74540901184082, -29.62629508972168, -28.50718116760254, -27.3880672454834, -26.26895523071289, -25.14984130859375, -24.03072738647461, -22.91161346435547, -21.792499542236328, -20.673385620117188, -19.554271697998047, -18.435157775878906, -17.316043853759766, -16.196929931640625, -15.077817916870117, -13.958703994750977, -12.839590072631836, -11.720476150512695, -10.601362228393555, -9.48224925994873, -8.36313533782959, -7.244021415710449, -6.124907970428467, -5.005794525146484, -3.8866806030273438, -2.7675669193267822, -1.6484532356262207, -0.5293395519256592, 0.5897741317749023, 1.708888053894043, 2.8280014991760254, 3.947114944458008, 5.066226959228516, 6.185340881347656, 7.304454326629639, 8.423567771911621, 9.542681694030762, 10.661795616149902, 11.780908584594727, 12.900022506713867, 14.019136428833008, 15.138250350952148, 16.25736427307129, 17.37647819519043, 18.495590209960938, 19.614704132080078, 20.73381805419922, 21.85293197631836, 22.9720458984375, 24.09115982055664, 25.21027374267578, 26.329387664794922, 27.448501586914062, 28.567615509033203, 29.68672752380371, 30.80584144592285, 31.924955368041992, 33.0440673828125, 34.16318130493164, 35.28229522705078, 36.40140914916992, 37.52052307128906, 38.6396369934082, 39.758750915527344, 40.877864837646484]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 4.0, 3.0, 7.0, 3.0, 10.0, 11.0, 11.0, 15.0, 18.0, 26.0, 26.0, 26.0, 45.0, 58.0, 55.0, 78.0, 62.0, 65.0, 75.0, 58.0, 47.0, 58.0, 34.0, 38.0, 30.0, 29.0, 18.0, 23.0, 12.0, 12.0, 11.0, 7.0, 8.0, 7.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.724720001220703, -28.909807205200195, -28.094894409179688, -27.279979705810547, -26.46506690979004, -25.65015411376953, -24.835241317749023, -24.020328521728516, -23.205413818359375, -22.390501022338867, -21.57558822631836, -20.76067352294922, -19.94576072692871, -19.130847930908203, -18.315935134887695, -17.501022338867188, -16.686107635498047, -15.871194839477539, -15.056281089782715, -14.241368293762207, -13.426454544067383, -12.611541748046875, -11.796628952026367, -10.981715202331543, -10.166803359985352, -9.351890563964844, -8.53697681427002, -7.722064018249512, -6.9071502685546875, -6.09223747253418, -5.277324199676514, -4.462410926818848, -3.6474971771240234, -2.8325839042663574, -2.0176706314086914, -1.2027575969696045, -0.3878443241119385, 0.42706871032714844, 1.2419819831848145, 2.0568952560424805, 2.8718085289001465, 3.6867218017578125, 4.5016350746154785, 5.3165483474731445, 6.131461143493652, 6.946374416351318, 7.761287689208984, 8.576200485229492, 9.391114234924316, 10.206027030944824, 11.020940780639648, 11.835853576660156, 12.65076732635498, 13.465680122375488, 14.280593872070312, 15.09550666809082, 15.910419464111328, 16.725332260131836, 17.540245056152344, 18.355159759521484, 19.170072555541992, 19.9849853515625, 20.799898147583008, 21.614810943603516, 22.429725646972656]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 7.0, 5.0, 8.0, 2.0, 9.0, 9.0, 7.0, 13.0, 17.0, 25.0, 31.0, 23.0, 53.0, 91.0, 122.0, 207.0, 341.0, 598.0, 1179.0, 2676.0, 7419.0, 46596.0, 4108544.0, 17963.0, 4701.0, 1845.0, 849.0, 402.0, 216.0, 129.0, 72.0, 43.0, 25.0, 17.0, 15.0, 7.0, 7.0, 7.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.1796875, -7.96026611328125, -7.7408447265625, -7.52142333984375, -7.302001953125, -7.08258056640625, -6.8631591796875, -6.64373779296875, -6.42431640625, -6.20489501953125, -5.9854736328125, -5.76605224609375, -5.546630859375, -5.32720947265625, -5.1077880859375, -4.88836669921875, -4.6689453125, -4.44952392578125, -4.2301025390625, -4.01068115234375, -3.791259765625, -3.57183837890625, -3.3524169921875, -3.13299560546875, -2.91357421875, -2.69415283203125, -2.4747314453125, -2.25531005859375, -2.035888671875, -1.81646728515625, -1.5970458984375, -1.37762451171875, -1.158203125, -0.93878173828125, -0.7193603515625, -0.49993896484375, -0.280517578125, -0.06109619140625, 0.1583251953125, 0.37774658203125, 0.59716796875, 0.81658935546875, 1.0360107421875, 1.25543212890625, 1.474853515625, 1.69427490234375, 1.9136962890625, 2.13311767578125, 2.3525390625, 2.57196044921875, 2.7913818359375, 3.01080322265625, 3.230224609375, 3.44964599609375, 3.6690673828125, 3.88848876953125, 4.10791015625, 4.32733154296875, 4.5467529296875, 4.76617431640625, 4.985595703125, 5.20501708984375, 5.4244384765625, 5.64385986328125, 5.86328125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 6.0, 2.0, 3.0, 6.0, 12.0, 12.0, 17.0, 25.0, 38.0, 50.0, 64.0, 93.0, 110.0, 107.0, 96.0, 90.0, 90.0, 62.0, 39.0, 19.0, 18.0, 13.0, 8.0, 6.0, 2.0, 7.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3818359375, -1.34271240234375, -1.3035888671875, -1.26446533203125, -1.225341796875, -1.18621826171875, -1.1470947265625, -1.10797119140625, -1.06884765625, -1.02972412109375, -0.9906005859375, -0.95147705078125, -0.912353515625, -0.87322998046875, -0.8341064453125, -0.79498291015625, -0.755859375, -0.71673583984375, -0.6776123046875, -0.63848876953125, -0.599365234375, -0.56024169921875, -0.5211181640625, -0.48199462890625, -0.44287109375, -0.40374755859375, -0.3646240234375, -0.32550048828125, -0.286376953125, -0.24725341796875, -0.2081298828125, -0.16900634765625, -0.1298828125, -0.09075927734375, -0.0516357421875, -0.01251220703125, 0.026611328125, 0.06573486328125, 0.1048583984375, 0.14398193359375, 0.18310546875, 0.22222900390625, 0.2613525390625, 0.30047607421875, 0.339599609375, 0.37872314453125, 0.4178466796875, 0.45697021484375, 0.49609375, 0.53521728515625, 0.5743408203125, 0.61346435546875, 0.652587890625, 0.69171142578125, 0.7308349609375, 0.76995849609375, 0.80908203125, 0.84820556640625, 0.8873291015625, 0.92645263671875, 0.965576171875, 1.00469970703125, 1.0438232421875, 1.08294677734375, 1.1220703125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 7.0, 12.0, 13.0, 18.0, 17.0, 26.0, 39.0, 52.0, 74.0, 100.0, 113.0, 146.0, 216.0, 296.0, 432.0, 540.0, 820.0, 1245.0, 1816.0, 3049.0, 5212.0, 10296.0, 25688.0, 854346.0, 3239453.0, 25768.0, 10387.0, 5231.0, 3016.0, 1764.0, 1183.0, 795.0, 558.0, 386.0, 303.0, 184.0, 182.0, 131.0, 89.0, 69.0, 57.0, 39.0, 36.0, 21.0, 17.0, 14.0, 11.0, 10.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-5.9375, -5.76287841796875, -5.5882568359375, -5.41363525390625, -5.239013671875, -5.06439208984375, -4.8897705078125, -4.71514892578125, -4.54052734375, -4.36590576171875, -4.1912841796875, -4.01666259765625, -3.842041015625, -3.66741943359375, -3.4927978515625, -3.31817626953125, -3.1435546875, -2.96893310546875, -2.7943115234375, -2.61968994140625, -2.445068359375, -2.27044677734375, -2.0958251953125, -1.92120361328125, -1.74658203125, -1.57196044921875, -1.3973388671875, -1.22271728515625, -1.048095703125, -0.87347412109375, -0.6988525390625, -0.52423095703125, -0.349609375, -0.17498779296875, -0.0003662109375, 0.17425537109375, 0.348876953125, 0.52349853515625, 0.6981201171875, 0.87274169921875, 1.04736328125, 1.22198486328125, 1.3966064453125, 1.57122802734375, 1.745849609375, 1.92047119140625, 2.0950927734375, 2.26971435546875, 2.4443359375, 2.61895751953125, 2.7935791015625, 2.96820068359375, 3.142822265625, 3.31744384765625, 3.4920654296875, 3.66668701171875, 3.84130859375, 4.01593017578125, 4.1905517578125, 4.36517333984375, 4.539794921875, 4.71441650390625, 4.8890380859375, 5.06365966796875, 5.23828125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 9.0, 10.0, 12.0, 12.0, 23.0, 71.0, 3711.0, 94.0, 40.0, 28.0, 15.0, 7.0, 11.0, 4.0, 4.0, 1.0, 2.0, 5.0, 1.0, 0.0, 0.0, 5.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.203125, -2.137420654296875, -2.07171630859375, -2.006011962890625, -1.9403076171875, -1.874603271484375, -1.80889892578125, -1.743194580078125, -1.677490234375, -1.611785888671875, -1.54608154296875, -1.480377197265625, -1.4146728515625, -1.348968505859375, -1.28326416015625, -1.217559814453125, -1.15185546875, -1.086151123046875, -1.02044677734375, -0.954742431640625, -0.8890380859375, -0.823333740234375, -0.75762939453125, -0.691925048828125, -0.626220703125, -0.560516357421875, -0.49481201171875, -0.429107666015625, -0.3634033203125, -0.297698974609375, -0.23199462890625, -0.166290283203125, -0.1005859375, -0.034881591796875, 0.03082275390625, 0.096527099609375, 0.1622314453125, 0.227935791015625, 0.29364013671875, 0.359344482421875, 0.425048828125, 0.490753173828125, 0.55645751953125, 0.622161865234375, 0.6878662109375, 0.753570556640625, 0.81927490234375, 0.884979248046875, 0.95068359375, 1.016387939453125, 1.08209228515625, 1.147796630859375, 1.2135009765625, 1.279205322265625, 1.34490966796875, 1.410614013671875, 1.476318359375, 1.542022705078125, 1.60772705078125, 1.673431396484375, 1.7391357421875, 1.804840087890625, 1.87054443359375, 1.936248779296875, 2.001953125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 6.0, 10.0, 22.0, 18.0, 26.0, 36.0, 78.0, 91.0, 144.0, 144.0, 99.0, 105.0, 63.0, 47.0, 28.0, 23.0, 11.0, 17.0, 11.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.044249534606934, -7.791569709777832, -7.538889408111572, -7.286209583282471, -7.033529281616211, -6.780849456787109, -6.528169631958008, -6.275489807128906, -6.0228095054626465, -5.770129680633545, -5.517449378967285, -5.264769554138184, -5.012089729309082, -4.759409427642822, -4.506729602813721, -4.254049301147461, -4.001369476318359, -3.7486894130706787, -3.496009349822998, -3.2433295249938965, -2.990649461746216, -2.737969398498535, -2.4852895736694336, -2.232609510421753, -1.9799294471740723, -1.7272493839263916, -1.4745694398880005, -1.2218894958496094, -0.9692094326019287, -0.716529369354248, -0.46384942531585693, -0.21116948127746582, 0.04150962829589844, 0.2941896319389343, 0.5468696355819702, 0.7995496392250061, 1.052229642868042, 1.3049097061157227, 1.5575896501541138, 1.8102695941925049, 2.0629496574401855, 2.315629720687866, 2.568309783935547, 2.8209896087646484, 3.073669672012329, 3.3263497352600098, 3.5790295600891113, 3.831709623336792, 4.084389686584473, 4.337069511413574, 4.589749813079834, 4.8424296379089355, 5.095109939575195, 5.347789764404297, 5.600469589233398, 5.8531494140625, 6.10582971572876, 6.358509540557861, 6.611189842224121, 6.863869667053223, 7.116549491882324, 7.369229793548584, 7.6219096183776855, 7.874589920043945, 8.127269744873047]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 1.0, 3.0, 5.0, 6.0, 14.0, 8.0, 23.0, 16.0, 16.0, 16.0, 20.0, 14.0, 22.0, 25.0, 29.0, 32.0, 29.0, 33.0, 38.0, 49.0, 38.0, 43.0, 45.0, 39.0, 44.0, 43.0, 35.0, 38.0, 32.0, 35.0, 29.0, 26.0, 23.0, 25.0, 18.0, 12.0, 9.0, 12.0, 8.0, 11.0, 7.0, 5.0, 7.0, 6.0, 5.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.204047203063965, -5.041396141052246, -4.878745079040527, -4.716094017028809, -4.55344295501709, -4.390791893005371, -4.228140830993652, -4.065489768981934, -3.9028384685516357, -3.740187406539917, -3.5775363445281982, -3.4148852825164795, -3.2522339820861816, -3.089582920074463, -2.926931858062744, -2.7642807960510254, -2.6016297340393066, -2.438978672027588, -2.276327610015869, -2.1136765480041504, -1.951025366783142, -1.7883743047714233, -1.625723123550415, -1.4630720615386963, -1.3004209995269775, -1.1377699375152588, -0.9751188158988953, -0.8124676942825317, -0.649816632270813, -0.48716557025909424, -0.3245144486427307, -0.1618633270263672, 0.0007877349853515625, 0.1634388267993927, 0.32608991861343384, 0.488741010427475, 0.6513921022415161, 0.8140431642532349, 0.9766942858695984, 1.139345407485962, 1.3019964694976807, 1.4646475315093994, 1.6272985935211182, 1.7899497747421265, 1.9526008367538452, 2.1152520179748535, 2.2779030799865723, 2.440554141998291, 2.6032052040100098, 2.7658562660217285, 2.9285073280334473, 3.091158390045166, 3.2538094520568848, 3.4164605140686035, 3.5791118144989014, 3.74176287651062, 3.904413938522339, 4.067065238952637, 4.2297163009643555, 4.392367362976074, 4.555018424987793, 4.717669486999512, 4.8803205490112305, 5.042971611022949, 5.205622673034668]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 4.0, 8.0, 10.0, 12.0, 10.0, 14.0, 25.0, 27.0, 40.0, 69.0, 76.0, 145.0, 188.0, 321.0, 508.0, 747.0, 1360.0, 2433.0, 4817.0, 10013.0, 23870.0, 68408.0, 266204.0, 474316.0, 126769.0, 38578.0, 14852.0, 6771.0, 3392.0, 1807.0, 1003.0, 616.0, 368.0, 259.0, 150.0, 94.0, 70.0, 69.0, 40.0, 27.0, 16.0, 19.0, 9.0, 12.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-3.166015625, -3.070770263671875, -2.97552490234375, -2.880279541015625, -2.7850341796875, -2.689788818359375, -2.59454345703125, -2.499298095703125, -2.404052734375, -2.308807373046875, -2.21356201171875, -2.118316650390625, -2.0230712890625, -1.927825927734375, -1.83258056640625, -1.737335205078125, -1.64208984375, -1.546844482421875, -1.45159912109375, -1.356353759765625, -1.2611083984375, -1.165863037109375, -1.07061767578125, -0.975372314453125, -0.880126953125, -0.784881591796875, -0.68963623046875, -0.594390869140625, -0.4991455078125, -0.403900146484375, -0.30865478515625, -0.213409423828125, -0.1181640625, -0.022918701171875, 0.07232666015625, 0.167572021484375, 0.2628173828125, 0.358062744140625, 0.45330810546875, 0.548553466796875, 0.643798828125, 0.739044189453125, 0.83428955078125, 0.929534912109375, 1.0247802734375, 1.120025634765625, 1.21527099609375, 1.310516357421875, 1.40576171875, 1.501007080078125, 1.59625244140625, 1.691497802734375, 1.7867431640625, 1.881988525390625, 1.97723388671875, 2.072479248046875, 2.167724609375, 2.262969970703125, 2.35821533203125, 2.453460693359375, 2.5487060546875, 2.643951416015625, 2.73919677734375, 2.834442138671875, 2.9296875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 7.0, 2.0, 4.0, 7.0, 16.0, 12.0, 17.0, 22.0, 35.0, 35.0, 47.0, 40.0, 69.0, 72.0, 99.0, 85.0, 87.0, 72.0, 50.0, 40.0, 49.0, 39.0, 33.0, 17.0, 14.0, 9.0, 9.0, 4.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.5146484375, -1.4702911376953125, -1.425933837890625, -1.3815765380859375, -1.33721923828125, -1.2928619384765625, -1.248504638671875, -1.2041473388671875, -1.1597900390625, -1.1154327392578125, -1.071075439453125, -1.0267181396484375, -0.98236083984375, -0.9380035400390625, -0.893646240234375, -0.8492889404296875, -0.804931640625, -0.7605743408203125, -0.716217041015625, -0.6718597412109375, -0.62750244140625, -0.5831451416015625, -0.538787841796875, -0.4944305419921875, -0.4500732421875, -0.4057159423828125, -0.361358642578125, -0.3170013427734375, -0.27264404296875, -0.2282867431640625, -0.183929443359375, -0.1395721435546875, -0.09521484375, -0.0508575439453125, -0.006500244140625, 0.0378570556640625, 0.08221435546875, 0.1265716552734375, 0.170928955078125, 0.2152862548828125, 0.2596435546875, 0.3040008544921875, 0.348358154296875, 0.3927154541015625, 0.43707275390625, 0.4814300537109375, 0.525787353515625, 0.5701446533203125, 0.614501953125, 0.6588592529296875, 0.703216552734375, 0.7475738525390625, 0.79193115234375, 0.8362884521484375, 0.880645751953125, 0.9250030517578125, 0.9693603515625, 1.0137176513671875, 1.058074951171875, 1.1024322509765625, 1.14678955078125, 1.1911468505859375, 1.235504150390625, 1.2798614501953125, 1.32421875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 12.0, 8.0, 5.0, 26.0, 49.0, 54.0, 106.0, 196.0, 355.0, 742.0, 1703.0, 4871.0, 19662.0, 164109.0, 769441.0, 69662.0, 11596.0, 3437.0, 1235.0, 570.0, 297.0, 159.0, 100.0, 51.0, 40.0, 28.0, 11.0, 8.0, 5.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0703125, -7.795166015625, -7.52001953125, -7.244873046875, -6.9697265625, -6.694580078125, -6.41943359375, -6.144287109375, -5.869140625, -5.593994140625, -5.31884765625, -5.043701171875, -4.7685546875, -4.493408203125, -4.21826171875, -3.943115234375, -3.66796875, -3.392822265625, -3.11767578125, -2.842529296875, -2.5673828125, -2.292236328125, -2.01708984375, -1.741943359375, -1.466796875, -1.191650390625, -0.91650390625, -0.641357421875, -0.3662109375, -0.091064453125, 0.18408203125, 0.459228515625, 0.734375, 1.009521484375, 1.28466796875, 1.559814453125, 1.8349609375, 2.110107421875, 2.38525390625, 2.660400390625, 2.935546875, 3.210693359375, 3.48583984375, 3.760986328125, 4.0361328125, 4.311279296875, 4.58642578125, 4.861572265625, 5.13671875, 5.411865234375, 5.68701171875, 5.962158203125, 6.2373046875, 6.512451171875, 6.78759765625, 7.062744140625, 7.337890625, 7.613037109375, 7.88818359375, 8.163330078125, 8.4384765625, 8.713623046875, 8.98876953125, 9.263916015625, 9.5390625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 6.0, 0.0, 2.0, 6.0, 5.0, 5.0, 6.0, 2.0, 8.0, 19.0, 12.0, 16.0, 23.0, 41.0, 47.0, 58.0, 47.0, 71.0, 84.0, 96.0, 75.0, 71.0, 49.0, 50.0, 43.0, 33.0, 37.0, 18.0, 22.0, 9.0, 13.0, 10.0, 10.0, 7.0, 2.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.6796875, -9.35302734375, -9.0263671875, -8.69970703125, -8.373046875, -8.04638671875, -7.7197265625, -7.39306640625, -7.06640625, -6.73974609375, -6.4130859375, -6.08642578125, -5.759765625, -5.43310546875, -5.1064453125, -4.77978515625, -4.453125, -4.12646484375, -3.7998046875, -3.47314453125, -3.146484375, -2.81982421875, -2.4931640625, -2.16650390625, -1.83984375, -1.51318359375, -1.1865234375, -0.85986328125, -0.533203125, -0.20654296875, 0.1201171875, 0.44677734375, 0.7734375, 1.10009765625, 1.4267578125, 1.75341796875, 2.080078125, 2.40673828125, 2.7333984375, 3.06005859375, 3.38671875, 3.71337890625, 4.0400390625, 4.36669921875, 4.693359375, 5.02001953125, 5.3466796875, 5.67333984375, 6.0, 6.32666015625, 6.6533203125, 6.97998046875, 7.306640625, 7.63330078125, 7.9599609375, 8.28662109375, 8.61328125, 8.93994140625, 9.2666015625, 9.59326171875, 9.919921875, 10.24658203125, 10.5732421875, 10.89990234375, 11.2265625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 11.0, 4.0, 15.0, 14.0, 32.0, 59.0, 75.0, 141.0, 285.0, 751.0, 3179.0, 137673.0, 898530.0, 5919.0, 1046.0, 382.0, 163.0, 104.0, 58.0, 38.0, 30.0, 12.0, 14.0, 4.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.46875, -10.162109375, -9.85546875, -9.548828125, -9.2421875, -8.935546875, -8.62890625, -8.322265625, -8.015625, -7.708984375, -7.40234375, -7.095703125, -6.7890625, -6.482421875, -6.17578125, -5.869140625, -5.5625, -5.255859375, -4.94921875, -4.642578125, -4.3359375, -4.029296875, -3.72265625, -3.416015625, -3.109375, -2.802734375, -2.49609375, -2.189453125, -1.8828125, -1.576171875, -1.26953125, -0.962890625, -0.65625, -0.349609375, -0.04296875, 0.263671875, 0.5703125, 0.876953125, 1.18359375, 1.490234375, 1.796875, 2.103515625, 2.41015625, 2.716796875, 3.0234375, 3.330078125, 3.63671875, 3.943359375, 4.25, 4.556640625, 4.86328125, 5.169921875, 5.4765625, 5.783203125, 6.08984375, 6.396484375, 6.703125, 7.009765625, 7.31640625, 7.623046875, 7.9296875, 8.236328125, 8.54296875, 8.849609375, 9.15625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 10.0, 14.0, 38.0, 65.0, 153.0, 278.0, 221.0, 126.0, 49.0, 25.0, 14.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006799697875976562, -0.0006571859121322632, -0.0006344020366668701, -0.000611618161201477, -0.000588834285736084, -0.0005660504102706909, -0.0005432665348052979, -0.0005204826593399048, -0.0004976987838745117, -0.00047491490840911865, -0.0004521310329437256, -0.0004293471574783325, -0.00040656328201293945, -0.0003837794065475464, -0.0003609955310821533, -0.00033821165561676025, -0.0003154277801513672, -0.0002926439046859741, -0.00026986002922058105, -0.000247076153755188, -0.00022429227828979492, -0.00020150840282440186, -0.0001787245273590088, -0.00015594065189361572, -0.00013315677642822266, -0.00011037290096282959, -8.758902549743652e-05, -6.480515003204346e-05, -4.202127456665039e-05, -1.9237399101257324e-05, 3.546476364135742e-06, 2.633035182952881e-05, 4.9114227294921875e-05, 7.189810276031494e-05, 9.468197822570801e-05, 0.00011746585369110107, 0.00014024972915649414, 0.0001630336046218872, 0.00018581748008728027, 0.00020860135555267334, 0.0002313852310180664, 0.00025416910648345947, 0.00027695298194885254, 0.0002997368574142456, 0.00032252073287963867, 0.00034530460834503174, 0.0003680884838104248, 0.00039087235927581787, 0.00041365623474121094, 0.000436440110206604, 0.00045922398567199707, 0.00048200786113739014, 0.0005047917366027832, 0.0005275756120681763, 0.0005503594875335693, 0.0005731433629989624, 0.0005959272384643555, 0.0006187111139297485, 0.0006414949893951416, 0.0006642788648605347, 0.0006870627403259277, 0.0007098466157913208, 0.0007326304912567139, 0.0007554143667221069, 0.0007781982421875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 3.0, 6.0, 6.0, 15.0, 19.0, 22.0, 47.0, 107.0, 168.0, 350.0, 827.0, 2188.0, 8513.0, 81563.0, 896578.0, 48473.0, 6427.0, 1879.0, 693.0, 303.0, 158.0, 81.0, 47.0, 30.0, 11.0, 9.0, 5.0, 5.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.89453125, -4.7523193359375, -4.610107421875, -4.4678955078125, -4.32568359375, -4.1834716796875, -4.041259765625, -3.8990478515625, -3.7568359375, -3.6146240234375, -3.472412109375, -3.3302001953125, -3.18798828125, -3.0457763671875, -2.903564453125, -2.7613525390625, -2.619140625, -2.4769287109375, -2.334716796875, -2.1925048828125, -2.05029296875, -1.9080810546875, -1.765869140625, -1.6236572265625, -1.4814453125, -1.3392333984375, -1.197021484375, -1.0548095703125, -0.91259765625, -0.7703857421875, -0.628173828125, -0.4859619140625, -0.34375, -0.2015380859375, -0.059326171875, 0.0828857421875, 0.22509765625, 0.3673095703125, 0.509521484375, 0.6517333984375, 0.7939453125, 0.9361572265625, 1.078369140625, 1.2205810546875, 1.36279296875, 1.5050048828125, 1.647216796875, 1.7894287109375, 1.931640625, 2.0738525390625, 2.216064453125, 2.3582763671875, 2.50048828125, 2.6427001953125, 2.784912109375, 2.9271240234375, 3.0693359375, 3.2115478515625, 3.353759765625, 3.4959716796875, 3.63818359375, 3.7803955078125, 3.922607421875, 4.0648193359375, 4.20703125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 7.0, 21.0, 23.0, 56.0, 144.0, 245.0, 243.0, 141.0, 61.0, 27.0, 10.0, 4.0, 8.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.703125, -5.4990234375, -5.294921875, -5.0908203125, -4.88671875, -4.6826171875, -4.478515625, -4.2744140625, -4.0703125, -3.8662109375, -3.662109375, -3.4580078125, -3.25390625, -3.0498046875, -2.845703125, -2.6416015625, -2.4375, -2.2333984375, -2.029296875, -1.8251953125, -1.62109375, -1.4169921875, -1.212890625, -1.0087890625, -0.8046875, -0.6005859375, -0.396484375, -0.1923828125, 0.01171875, 0.2158203125, 0.419921875, 0.6240234375, 0.828125, 1.0322265625, 1.236328125, 1.4404296875, 1.64453125, 1.8486328125, 2.052734375, 2.2568359375, 2.4609375, 2.6650390625, 2.869140625, 3.0732421875, 3.27734375, 3.4814453125, 3.685546875, 3.8896484375, 4.09375, 4.2978515625, 4.501953125, 4.7060546875, 4.91015625, 5.1142578125, 5.318359375, 5.5224609375, 5.7265625, 5.9306640625, 6.134765625, 6.3388671875, 6.54296875, 6.7470703125, 6.951171875, 7.1552734375, 7.359375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 9.0, 10.0, 5.0, 9.0, 22.0, 24.0, 32.0, 59.0, 65.0, 110.0, 118.0, 132.0, 112.0, 94.0, 72.0, 37.0, 32.0, 17.0, 16.0, 11.0, 10.0, 3.0, 4.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-58.40155029296875, -56.9228630065918, -55.44417953491211, -53.965492248535156, -52.48680877685547, -51.008121490478516, -49.52943420410156, -48.050750732421875, -46.57206344604492, -45.09337615966797, -43.61469268798828, -42.13600540161133, -40.657318115234375, -39.17863464355469, -37.699947357177734, -36.22126007080078, -34.742576599121094, -33.26388931274414, -31.785205841064453, -30.3065185546875, -28.82783317565918, -27.34914779663086, -25.870460510253906, -24.391775131225586, -22.913089752197266, -21.434404373168945, -19.955718994140625, -18.477031707763672, -16.99834632873535, -15.519660949707031, -14.040974617004395, -12.562288284301758, -11.083602905273438, -9.604917526245117, -8.12623119354248, -6.647545337677002, -5.168859481811523, -3.690173625946045, -2.2114877700805664, -0.7328014373779297, 0.7458839416503906, 2.224569797515869, 3.7032556533813477, 5.181941509246826, 6.660627365112305, 8.139312744140625, 9.617999076843262, 11.096685409545898, 12.575370788574219, 14.054056167602539, 15.532742500305176, 17.011428833007812, 18.490114212036133, 19.968799591064453, 21.447486877441406, 22.926172256469727, 24.404857635498047, 25.883543014526367, 27.362228393554688, 28.84091567993164, 30.31960105895996, 31.79828643798828, 33.276973724365234, 34.75566101074219, 36.234344482421875]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 2.0, 4.0, 10.0, 6.0, 10.0, 6.0, 11.0, 17.0, 15.0, 23.0, 23.0, 22.0, 36.0, 40.0, 44.0, 49.0, 59.0, 57.0, 71.0, 65.0, 58.0, 56.0, 47.0, 53.0, 55.0, 34.0, 22.0, 25.0, 13.0, 15.0, 14.0, 8.0, 7.0, 7.0, 5.0, 5.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-52.012306213378906, -50.55244827270508, -49.09259033203125, -47.63273239135742, -46.172874450683594, -44.713016510009766, -43.25315856933594, -41.79330062866211, -40.33344268798828, -38.87358474731445, -37.413726806640625, -35.9538688659668, -34.49401092529297, -33.03415298461914, -31.574295043945312, -30.114437103271484, -28.654577255249023, -27.194719314575195, -25.734861373901367, -24.27500343322754, -22.81514549255371, -21.355287551879883, -19.895427703857422, -18.435569763183594, -16.975711822509766, -15.515853881835938, -14.05599594116211, -12.596138000488281, -11.136280059814453, -9.676422119140625, -8.21656322479248, -6.756705284118652, -5.296848297119141, -3.8369903564453125, -2.3771321773529053, -0.917273998260498, 0.5425839424133301, 2.002441883087158, 3.4623003005981445, 4.922158241271973, 6.382016181945801, 7.841874122619629, 9.301732063293457, 10.761590957641602, 12.22144889831543, 13.681306838989258, 15.141164779663086, 16.601022720336914, 18.060880661010742, 19.52073860168457, 20.9805965423584, 22.440454483032227, 23.900312423706055, 25.360170364379883, 26.820030212402344, 28.279888153076172, 29.73974609375, 31.199604034423828, 32.659461975097656, 34.119319915771484, 35.57917785644531, 37.03903579711914, 38.49889373779297, 39.9587516784668, 41.418609619140625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 4.0, 9.0, 11.0, 8.0, 10.0, 17.0, 23.0, 45.0, 69.0, 106.0, 212.0, 399.0, 1073.0, 4646.0, 4179404.0, 6065.0, 1262.0, 440.0, 211.0, 103.0, 63.0, 35.0, 27.0, 10.0, 10.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.890625, -28.177978515625, -27.46533203125, -26.752685546875, -26.0400390625, -25.327392578125, -24.61474609375, -23.902099609375, -23.189453125, -22.476806640625, -21.76416015625, -21.051513671875, -20.3388671875, -19.626220703125, -18.91357421875, -18.200927734375, -17.48828125, -16.775634765625, -16.06298828125, -15.350341796875, -14.6376953125, -13.925048828125, -13.21240234375, -12.499755859375, -11.787109375, -11.074462890625, -10.36181640625, -9.649169921875, -8.9365234375, -8.223876953125, -7.51123046875, -6.798583984375, -6.0859375, -5.373291015625, -4.66064453125, -3.947998046875, -3.2353515625, -2.522705078125, -1.81005859375, -1.097412109375, -0.384765625, 0.327880859375, 1.04052734375, 1.753173828125, 2.4658203125, 3.178466796875, 3.89111328125, 4.603759765625, 5.31640625, 6.029052734375, 6.74169921875, 7.454345703125, 8.1669921875, 8.879638671875, 9.59228515625, 10.304931640625, 11.017578125, 11.730224609375, 12.44287109375, 13.155517578125, 13.8681640625, 14.580810546875, 15.29345703125, 16.006103515625, 16.71875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 6.0, 3.0, 5.0, 6.0, 13.0, 15.0, 20.0, 38.0, 49.0, 81.0, 111.0, 152.0, 151.0, 128.0, 73.0, 45.0, 41.0, 21.0, 14.0, 5.0, 15.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.328125, -3.23248291015625, -3.1368408203125, -3.04119873046875, -2.945556640625, -2.84991455078125, -2.7542724609375, -2.65863037109375, -2.56298828125, -2.46734619140625, -2.3717041015625, -2.27606201171875, -2.180419921875, -2.08477783203125, -1.9891357421875, -1.89349365234375, -1.7978515625, -1.70220947265625, -1.6065673828125, -1.51092529296875, -1.415283203125, -1.31964111328125, -1.2239990234375, -1.12835693359375, -1.03271484375, -0.93707275390625, -0.8414306640625, -0.74578857421875, -0.650146484375, -0.55450439453125, -0.4588623046875, -0.36322021484375, -0.267578125, -0.17193603515625, -0.0762939453125, 0.01934814453125, 0.114990234375, 0.21063232421875, 0.3062744140625, 0.40191650390625, 0.49755859375, 0.59320068359375, 0.6888427734375, 0.78448486328125, 0.880126953125, 0.97576904296875, 1.0714111328125, 1.16705322265625, 1.2626953125, 1.35833740234375, 1.4539794921875, 1.54962158203125, 1.645263671875, 1.74090576171875, 1.8365478515625, 1.93218994140625, 2.02783203125, 2.12347412109375, 2.2191162109375, 2.31475830078125, 2.410400390625, 2.50604248046875, 2.6016845703125, 2.69732666015625, 2.79296875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 8.0, 5.0, 9.0, 12.0, 23.0, 33.0, 39.0, 37.0, 49.0, 83.0, 106.0, 149.0, 167.0, 237.0, 323.0, 462.0, 685.0, 1075.0, 2079.0, 7041.0, 4152728.0, 21295.0, 3340.0, 1452.0, 855.0, 560.0, 400.0, 295.0, 200.0, 137.0, 101.0, 73.0, 63.0, 44.0, 18.0, 24.0, 18.0, 18.0, 9.0, 10.0, 7.0, 4.0, 6.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-19.375, -18.817138671875, -18.25927734375, -17.701416015625, -17.1435546875, -16.585693359375, -16.02783203125, -15.469970703125, -14.912109375, -14.354248046875, -13.79638671875, -13.238525390625, -12.6806640625, -12.122802734375, -11.56494140625, -11.007080078125, -10.44921875, -9.891357421875, -9.33349609375, -8.775634765625, -8.2177734375, -7.659912109375, -7.10205078125, -6.544189453125, -5.986328125, -5.428466796875, -4.87060546875, -4.312744140625, -3.7548828125, -3.197021484375, -2.63916015625, -2.081298828125, -1.5234375, -0.965576171875, -0.40771484375, 0.150146484375, 0.7080078125, 1.265869140625, 1.82373046875, 2.381591796875, 2.939453125, 3.497314453125, 4.05517578125, 4.613037109375, 5.1708984375, 5.728759765625, 6.28662109375, 6.844482421875, 7.40234375, 7.960205078125, 8.51806640625, 9.075927734375, 9.6337890625, 10.191650390625, 10.74951171875, 11.307373046875, 11.865234375, 12.423095703125, 12.98095703125, 13.538818359375, 14.0966796875, 14.654541015625, 15.21240234375, 15.770263671875, 16.328125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 10.0, 10.0, 104.0, 3906.0, 30.0, 3.0, 3.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.78515625, -4.652984619140625, -4.52081298828125, -4.388641357421875, -4.2564697265625, -4.124298095703125, -3.99212646484375, -3.859954833984375, -3.727783203125, -3.595611572265625, -3.46343994140625, -3.331268310546875, -3.1990966796875, -3.066925048828125, -2.93475341796875, -2.802581787109375, -2.67041015625, -2.538238525390625, -2.40606689453125, -2.273895263671875, -2.1417236328125, -2.009552001953125, -1.87738037109375, -1.745208740234375, -1.613037109375, -1.480865478515625, -1.34869384765625, -1.216522216796875, -1.0843505859375, -0.952178955078125, -0.82000732421875, -0.687835693359375, -0.5556640625, -0.423492431640625, -0.29132080078125, -0.159149169921875, -0.0269775390625, 0.105194091796875, 0.23736572265625, 0.369537353515625, 0.501708984375, 0.633880615234375, 0.76605224609375, 0.898223876953125, 1.0303955078125, 1.162567138671875, 1.29473876953125, 1.426910400390625, 1.55908203125, 1.691253662109375, 1.82342529296875, 1.955596923828125, 2.0877685546875, 2.219940185546875, 2.35211181640625, 2.484283447265625, 2.616455078125, 2.748626708984375, 2.88079833984375, 3.012969970703125, 3.1451416015625, 3.277313232421875, 3.40948486328125, 3.541656494140625, 3.673828125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 8.0, 5.0, 4.0, 3.0, 9.0, 15.0, 19.0, 27.0, 29.0, 33.0, 49.0, 62.0, 88.0, 123.0, 122.0, 121.0, 87.0, 56.0, 37.0, 31.0, 18.0, 19.0, 14.0, 9.0, 7.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.563186645507812, -8.302862167358398, -8.042536735534668, -7.782212257385254, -7.521887302398682, -7.261562347412109, -7.001237869262695, -6.740912914276123, -6.480587959289551, -6.2202630043029785, -5.9599385261535645, -5.699613571166992, -5.43928861618042, -5.178963661193848, -4.918639183044434, -4.658314228057861, -4.397989749908447, -4.137664794921875, -3.877340078353882, -3.6170153617858887, -3.3566904067993164, -3.0963656902313232, -2.83604097366333, -2.575716018676758, -2.3153913021087646, -2.0550665855407715, -1.7947416305541992, -1.534416913986206, -1.2740920782089233, -1.0137672424316406, -0.7534425258636475, -0.49311769008636475, -0.23279285430908203, 0.027531951665878296, 0.2878567576408386, 0.5481815338134766, 0.8085063695907593, 1.068831205368042, 1.3291559219360352, 1.5894807577133179, 1.8498055934906006, 2.1101303100585938, 2.370455265045166, 2.630779981613159, 2.8911046981811523, 3.1514296531677246, 3.4117543697357178, 3.672079086303711, 3.932404041290283, 4.1927289962768555, 4.4530534744262695, 4.713378429412842, 4.973703384399414, 5.234027862548828, 5.4943528175354, 5.754677772521973, 6.015002250671387, 6.275327205657959, 6.535651683807373, 6.795976638793945, 7.056301593780518, 7.31662654876709, 7.576951026916504, 7.837275981903076, 8.097600936889648]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 6.0, 3.0, 4.0, 7.0, 13.0, 4.0, 11.0, 15.0, 12.0, 17.0, 21.0, 19.0, 33.0, 28.0, 33.0, 42.0, 42.0, 42.0, 36.0, 47.0, 32.0, 39.0, 44.0, 43.0, 29.0, 48.0, 44.0, 29.0, 29.0, 35.0, 26.0, 27.0, 20.0, 30.0, 12.0, 19.0, 12.0, 12.0, 10.0, 7.0, 6.0, 7.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.181884288787842, -5.013457775115967, -4.84503173828125, -4.676605224609375, -4.5081787109375, -4.339752197265625, -4.17132568359375, -4.002899646759033, -3.834473133087158, -3.666046619415283, -3.4976203441619873, -3.3291940689086914, -3.1607675552368164, -2.9923410415649414, -2.8239147663116455, -2.6554884910583496, -2.4870619773864746, -2.3186354637145996, -2.1502091884613037, -1.9817827939987183, -1.8133563995361328, -1.6449300050735474, -1.476503610610962, -1.3080772161483765, -1.139650821685791, -0.9712244272232056, -0.8027980327606201, -0.6343716382980347, -0.4659452438354492, -0.29751884937286377, -0.12909245491027832, 0.03933393955230713, 0.20776081085205078, 0.37618720531463623, 0.5446135997772217, 0.7130399942398071, 0.8814663887023926, 1.049892783164978, 1.2183191776275635, 1.386745572090149, 1.5551719665527344, 1.7235983610153198, 1.8920247554779053, 2.060451030731201, 2.228877544403076, 2.397304058074951, 2.565730333328247, 2.734156608581543, 2.902583122253418, 3.071009635925293, 3.239435911178589, 3.4078621864318848, 3.5762887001037598, 3.7447152137756348, 3.9131414890289307, 4.081567764282227, 4.249994277954102, 4.418420791625977, 4.586847305297852, 4.755273342132568, 4.923699855804443, 5.092126369476318, 5.260552406311035, 5.42897891998291, 5.597405433654785]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 2.0, 4.0, 7.0, 8.0, 11.0, 11.0, 16.0, 19.0, 25.0, 45.0, 65.0, 100.0, 117.0, 189.0, 286.0, 458.0, 745.0, 1236.0, 2125.0, 4062.0, 8860.0, 23143.0, 77170.0, 410671.0, 402437.0, 75388.0, 22773.0, 8931.0, 4200.0, 2113.0, 1178.0, 774.0, 473.0, 288.0, 199.0, 119.0, 93.0, 58.0, 45.0, 40.0, 24.0, 17.0, 9.0, 12.0, 7.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0], "bins": [-4.91015625, -4.77374267578125, -4.6373291015625, -4.50091552734375, -4.364501953125, -4.22808837890625, -4.0916748046875, -3.95526123046875, -3.81884765625, -3.68243408203125, -3.5460205078125, -3.40960693359375, -3.273193359375, -3.13677978515625, -3.0003662109375, -2.86395263671875, -2.7275390625, -2.59112548828125, -2.4547119140625, -2.31829833984375, -2.181884765625, -2.04547119140625, -1.9090576171875, -1.77264404296875, -1.63623046875, -1.49981689453125, -1.3634033203125, -1.22698974609375, -1.090576171875, -0.95416259765625, -0.8177490234375, -0.68133544921875, -0.544921875, -0.40850830078125, -0.2720947265625, -0.13568115234375, 0.000732421875, 0.13714599609375, 0.2735595703125, 0.40997314453125, 0.54638671875, 0.68280029296875, 0.8192138671875, 0.95562744140625, 1.092041015625, 1.22845458984375, 1.3648681640625, 1.50128173828125, 1.6376953125, 1.77410888671875, 1.9105224609375, 2.04693603515625, 2.183349609375, 2.31976318359375, 2.4561767578125, 2.59259033203125, 2.72900390625, 2.86541748046875, 3.0018310546875, 3.13824462890625, 3.274658203125, 3.41107177734375, 3.5474853515625, 3.68389892578125, 3.8203125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 2.0, 2.0, 3.0, 7.0, 12.0, 3.0, 12.0, 19.0, 12.0, 18.0, 35.0, 52.0, 56.0, 84.0, 83.0, 103.0, 119.0, 83.0, 72.0, 56.0, 50.0, 36.0, 18.0, 15.0, 17.0, 7.0, 6.0, 2.0, 5.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.537109375, -2.459625244140625, -2.38214111328125, -2.304656982421875, -2.2271728515625, -2.149688720703125, -2.07220458984375, -1.994720458984375, -1.917236328125, -1.839752197265625, -1.76226806640625, -1.684783935546875, -1.6072998046875, -1.529815673828125, -1.45233154296875, -1.374847412109375, -1.29736328125, -1.219879150390625, -1.14239501953125, -1.064910888671875, -0.9874267578125, -0.909942626953125, -0.83245849609375, -0.754974365234375, -0.677490234375, -0.600006103515625, -0.52252197265625, -0.445037841796875, -0.3675537109375, -0.290069580078125, -0.21258544921875, -0.135101318359375, -0.0576171875, 0.019866943359375, 0.09735107421875, 0.174835205078125, 0.2523193359375, 0.329803466796875, 0.40728759765625, 0.484771728515625, 0.562255859375, 0.639739990234375, 0.71722412109375, 0.794708251953125, 0.8721923828125, 0.949676513671875, 1.02716064453125, 1.104644775390625, 1.18212890625, 1.259613037109375, 1.33709716796875, 1.414581298828125, 1.4920654296875, 1.569549560546875, 1.64703369140625, 1.724517822265625, 1.802001953125, 1.879486083984375, 1.95697021484375, 2.034454345703125, 2.1119384765625, 2.189422607421875, 2.26690673828125, 2.344390869140625, 2.421875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 6.0, 6.0, 9.0, 8.0, 16.0, 18.0, 23.0, 47.0, 71.0, 103.0, 204.0, 289.0, 612.0, 1439.0, 4029.0, 14423.0, 80200.0, 713534.0, 196831.0, 26291.0, 6315.0, 2150.0, 893.0, 439.0, 246.0, 123.0, 88.0, 40.0, 44.0, 18.0, 18.0, 12.0, 6.0, 6.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.90625, -6.6737060546875, -6.441162109375, -6.2086181640625, -5.97607421875, -5.7435302734375, -5.510986328125, -5.2784423828125, -5.0458984375, -4.8133544921875, -4.580810546875, -4.3482666015625, -4.11572265625, -3.8831787109375, -3.650634765625, -3.4180908203125, -3.185546875, -2.9530029296875, -2.720458984375, -2.4879150390625, -2.25537109375, -2.0228271484375, -1.790283203125, -1.5577392578125, -1.3251953125, -1.0926513671875, -0.860107421875, -0.6275634765625, -0.39501953125, -0.1624755859375, 0.070068359375, 0.3026123046875, 0.53515625, 0.7677001953125, 1.000244140625, 1.2327880859375, 1.46533203125, 1.6978759765625, 1.930419921875, 2.1629638671875, 2.3955078125, 2.6280517578125, 2.860595703125, 3.0931396484375, 3.32568359375, 3.5582275390625, 3.790771484375, 4.0233154296875, 4.255859375, 4.4884033203125, 4.720947265625, 4.9534912109375, 5.18603515625, 5.4185791015625, 5.651123046875, 5.8836669921875, 6.1162109375, 6.3487548828125, 6.581298828125, 6.8138427734375, 7.04638671875, 7.2789306640625, 7.511474609375, 7.7440185546875, 7.9765625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 7.0, 5.0, 6.0, 7.0, 9.0, 15.0, 13.0, 22.0, 23.0, 27.0, 27.0, 37.0, 27.0, 47.0, 43.0, 53.0, 53.0, 58.0, 62.0, 48.0, 47.0, 49.0, 50.0, 45.0, 33.0, 41.0, 36.0, 26.0, 20.0, 17.0, 12.0, 8.0, 8.0, 6.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1171875, -8.8265380859375, -8.535888671875, -8.2452392578125, -7.95458984375, -7.6639404296875, -7.373291015625, -7.0826416015625, -6.7919921875, -6.5013427734375, -6.210693359375, -5.9200439453125, -5.62939453125, -5.3387451171875, -5.048095703125, -4.7574462890625, -4.466796875, -4.1761474609375, -3.885498046875, -3.5948486328125, -3.30419921875, -3.0135498046875, -2.722900390625, -2.4322509765625, -2.1416015625, -1.8509521484375, -1.560302734375, -1.2696533203125, -0.97900390625, -0.6883544921875, -0.397705078125, -0.1070556640625, 0.18359375, 0.4742431640625, 0.764892578125, 1.0555419921875, 1.34619140625, 1.6368408203125, 1.927490234375, 2.2181396484375, 2.5087890625, 2.7994384765625, 3.090087890625, 3.3807373046875, 3.67138671875, 3.9620361328125, 4.252685546875, 4.5433349609375, 4.833984375, 5.1246337890625, 5.415283203125, 5.7059326171875, 5.99658203125, 6.2872314453125, 6.577880859375, 6.8685302734375, 7.1591796875, 7.4498291015625, 7.740478515625, 8.0311279296875, 8.32177734375, 8.6124267578125, 8.903076171875, 9.1937255859375, 9.484375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 8.0, 9.0, 20.0, 36.0, 35.0, 66.0, 147.0, 345.0, 2151.0, 138741.0, 901422.0, 4703.0, 482.0, 160.0, 89.0, 51.0, 33.0, 18.0, 10.0, 8.0, 6.0, 5.0, 2.0, 8.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3828125, -12.0401611328125, -11.697509765625, -11.3548583984375, -11.01220703125, -10.6695556640625, -10.326904296875, -9.9842529296875, -9.6416015625, -9.2989501953125, -8.956298828125, -8.6136474609375, -8.27099609375, -7.9283447265625, -7.585693359375, -7.2430419921875, -6.900390625, -6.5577392578125, -6.215087890625, -5.8724365234375, -5.52978515625, -5.1871337890625, -4.844482421875, -4.5018310546875, -4.1591796875, -3.8165283203125, -3.473876953125, -3.1312255859375, -2.78857421875, -2.4459228515625, -2.103271484375, -1.7606201171875, -1.41796875, -1.0753173828125, -0.732666015625, -0.3900146484375, -0.04736328125, 0.2952880859375, 0.637939453125, 0.9805908203125, 1.3232421875, 1.6658935546875, 2.008544921875, 2.3511962890625, 2.69384765625, 3.0364990234375, 3.379150390625, 3.7218017578125, 4.064453125, 4.4071044921875, 4.749755859375, 5.0924072265625, 5.43505859375, 5.7777099609375, 6.120361328125, 6.4630126953125, 6.8056640625, 7.1483154296875, 7.490966796875, 7.8336181640625, 8.17626953125, 8.5189208984375, 8.861572265625, 9.2042236328125, 9.546875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 11.0, 13.0, 35.0, 60.0, 174.0, 279.0, 238.0, 95.0, 48.0, 29.0, 12.0, 9.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003571510314941406, -0.0003290101885795593, -0.00030086934566497803, -0.00027272850275039673, -0.00024458765983581543, -0.00021644681692123413, -0.00018830597400665283, -0.00016016513109207153, -0.00013202428817749023, -0.00010388344526290894, -7.574260234832764e-05, -4.760175943374634e-05, -1.946091651916504e-05, 8.67992639541626e-06, 3.682076930999756e-05, 6.496161222457886e-05, 9.310245513916016e-05, 0.00012124329805374146, 0.00014938414096832275, 0.00017752498388290405, 0.00020566582679748535, 0.00023380666971206665, 0.00026194751262664795, 0.00029008835554122925, 0.00031822919845581055, 0.00034637004137039185, 0.00037451088428497314, 0.00040265172719955444, 0.00043079257011413574, 0.00045893341302871704, 0.00048707425594329834, 0.0005152150988578796, 0.0005433559417724609, 0.0005714967846870422, 0.0005996376276016235, 0.0006277784705162048, 0.0006559193134307861, 0.0006840601563453674, 0.0007122009992599487, 0.00074034184217453, 0.0007684826850891113, 0.0007966235280036926, 0.0008247643709182739, 0.0008529052138328552, 0.0008810460567474365, 0.0009091868996620178, 0.0009373277425765991, 0.0009654685854911804, 0.0009936094284057617, 0.001021750271320343, 0.0010498911142349243, 0.0010780319571495056, 0.001106172800064087, 0.0011343136429786682, 0.0011624544858932495, 0.0011905953288078308, 0.0012187361717224121, 0.0012468770146369934, 0.0012750178575515747, 0.001303158700466156, 0.0013312995433807373, 0.0013594403862953186, 0.0013875812292099, 0.0014157220721244812, 0.0014438629150390625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 15.0, 6.0, 10.0, 24.0, 40.0, 73.0, 156.0, 350.0, 952.0, 3859.0, 32671.0, 845179.0, 152809.0, 9679.0, 1720.0, 551.0, 220.0, 95.0, 65.0, 27.0, 20.0, 14.0, 7.0, 8.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.90625, -5.749755859375, -5.59326171875, -5.436767578125, -5.2802734375, -5.123779296875, -4.96728515625, -4.810791015625, -4.654296875, -4.497802734375, -4.34130859375, -4.184814453125, -4.0283203125, -3.871826171875, -3.71533203125, -3.558837890625, -3.40234375, -3.245849609375, -3.08935546875, -2.932861328125, -2.7763671875, -2.619873046875, -2.46337890625, -2.306884765625, -2.150390625, -1.993896484375, -1.83740234375, -1.680908203125, -1.5244140625, -1.367919921875, -1.21142578125, -1.054931640625, -0.8984375, -0.741943359375, -0.58544921875, -0.428955078125, -0.2724609375, -0.115966796875, 0.04052734375, 0.197021484375, 0.353515625, 0.510009765625, 0.66650390625, 0.822998046875, 0.9794921875, 1.135986328125, 1.29248046875, 1.448974609375, 1.60546875, 1.761962890625, 1.91845703125, 2.074951171875, 2.2314453125, 2.387939453125, 2.54443359375, 2.700927734375, 2.857421875, 3.013916015625, 3.17041015625, 3.326904296875, 3.4833984375, 3.639892578125, 3.79638671875, 3.952880859375, 4.109375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 2.0, 8.0, 6.0, 9.0, 16.0, 22.0, 34.0, 35.0, 55.0, 86.0, 107.0, 139.0, 141.0, 105.0, 52.0, 53.0, 37.0, 33.0, 19.0, 11.0, 15.0, 4.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.912109375, -3.799957275390625, -3.68780517578125, -3.575653076171875, -3.4635009765625, -3.351348876953125, -3.23919677734375, -3.127044677734375, -3.014892578125, -2.902740478515625, -2.79058837890625, -2.678436279296875, -2.5662841796875, -2.454132080078125, -2.34197998046875, -2.229827880859375, -2.11767578125, -2.005523681640625, -1.89337158203125, -1.781219482421875, -1.6690673828125, -1.556915283203125, -1.44476318359375, -1.332611083984375, -1.220458984375, -1.108306884765625, -0.99615478515625, -0.884002685546875, -0.7718505859375, -0.659698486328125, -0.54754638671875, -0.435394287109375, -0.3232421875, -0.211090087890625, -0.09893798828125, 0.013214111328125, 0.1253662109375, 0.237518310546875, 0.34967041015625, 0.461822509765625, 0.573974609375, 0.686126708984375, 0.79827880859375, 0.910430908203125, 1.0225830078125, 1.134735107421875, 1.24688720703125, 1.359039306640625, 1.47119140625, 1.583343505859375, 1.69549560546875, 1.807647705078125, 1.9197998046875, 2.031951904296875, 2.14410400390625, 2.256256103515625, 2.368408203125, 2.480560302734375, 2.59271240234375, 2.704864501953125, 2.8170166015625, 2.929168701171875, 3.04132080078125, 3.153472900390625, 3.265625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 15.0, 19.0, 12.0, 38.0, 71.0, 120.0, 160.0, 162.0, 166.0, 107.0, 47.0, 37.0, 20.0, 11.0, 4.0, 3.0, 8.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-84.06126403808594, -82.25242614746094, -80.44358825683594, -78.63475036621094, -76.82591247558594, -75.01707458496094, -73.20823669433594, -71.39939880371094, -69.59056091308594, -67.78172302246094, -65.97288513183594, -64.16404724121094, -62.35520935058594, -60.54637145996094, -58.73753356933594, -56.92869567871094, -55.1198616027832, -53.3110237121582, -51.5021858215332, -49.6933479309082, -47.8845100402832, -46.0756721496582, -44.26683807373047, -42.45800018310547, -40.64916229248047, -38.84032440185547, -37.03148651123047, -35.22264862060547, -33.41381072998047, -31.60497283935547, -29.7961368560791, -27.9872989654541, -26.17845916748047, -24.36962127685547, -22.56078338623047, -20.75194549560547, -18.94310760498047, -17.13426971435547, -15.325433731079102, -13.516595840454102, -11.707757949829102, -9.898920059204102, -8.090082168579102, -6.281245231628418, -4.472407341003418, -2.663569450378418, -0.8547325134277344, 0.9541053771972656, 2.7629432678222656, 4.571781158447266, 6.380618572235107, 8.18945598602295, 9.99829387664795, 11.80713176727295, 13.615968704223633, 15.424806594848633, 17.233644485473633, 19.042482376098633, 20.851320266723633, 22.66015625, 24.468994140625, 26.27783203125, 28.086669921875, 29.8955078125, 31.704345703125]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 5.0, 6.0, 15.0, 20.0, 21.0, 18.0, 22.0, 35.0, 41.0, 55.0, 66.0, 65.0, 66.0, 82.0, 91.0, 59.0, 55.0, 65.0, 44.0, 36.0, 26.0, 31.0, 19.0, 15.0, 13.0, 11.0, 12.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.64944839477539, -61.10551071166992, -59.56157302856445, -58.017635345458984, -56.473697662353516, -54.92975616455078, -53.38581848144531, -51.841880798339844, -50.297943115234375, -48.754005432128906, -47.21006774902344, -45.66613006591797, -44.1221923828125, -42.57825469970703, -41.03431701660156, -39.49037551879883, -37.946441650390625, -36.402503967285156, -34.85856628417969, -33.31462860107422, -31.770689010620117, -30.22675132751465, -28.68281364440918, -27.138874053955078, -25.59493637084961, -24.05099868774414, -22.507061004638672, -20.963123321533203, -19.4191837310791, -17.875246047973633, -16.331308364868164, -14.787369728088379, -13.243431091308594, -11.699493408203125, -10.15555477142334, -8.611617088317871, -7.067678928375244, -5.523740768432617, -3.9798030853271484, -2.4358644485473633, -0.8919267654418945, 0.6520112752914429, 2.1959493160247803, 3.739887237548828, 5.283825397491455, 6.827763557434082, 8.37170124053955, 9.915639877319336, 11.459577560424805, 13.003515243530273, 14.547453880310059, 16.091392517089844, 17.635330200195312, 19.17926788330078, 20.72320556640625, 22.26714324951172, 23.811080932617188, 25.355018615722656, 26.898956298828125, 28.442893981933594, 29.986833572387695, 31.530771255493164, 33.07470703125, 34.618648529052734, 36.1625862121582]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 8.0, 3.0, 4.0, 6.0, 8.0, 8.0, 7.0, 17.0, 18.0, 25.0, 38.0, 63.0, 93.0, 151.0, 254.0, 493.0, 1264.0, 4178.0, 237030.0, 3943385.0, 4932.0, 1275.0, 484.0, 230.0, 128.0, 63.0, 48.0, 28.0, 14.0, 11.0, 2.0, 9.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-25.84375, -25.2696533203125, -24.695556640625, -24.1214599609375, -23.54736328125, -22.9732666015625, -22.399169921875, -21.8250732421875, -21.2509765625, -20.6768798828125, -20.102783203125, -19.5286865234375, -18.95458984375, -18.3804931640625, -17.806396484375, -17.2322998046875, -16.658203125, -16.0841064453125, -15.510009765625, -14.9359130859375, -14.36181640625, -13.7877197265625, -13.213623046875, -12.6395263671875, -12.0654296875, -11.4913330078125, -10.917236328125, -10.3431396484375, -9.76904296875, -9.1949462890625, -8.620849609375, -8.0467529296875, -7.47265625, -6.8985595703125, -6.324462890625, -5.7503662109375, -5.17626953125, -4.6021728515625, -4.028076171875, -3.4539794921875, -2.8798828125, -2.3057861328125, -1.731689453125, -1.1575927734375, -0.58349609375, -0.0093994140625, 0.564697265625, 1.1387939453125, 1.712890625, 2.2869873046875, 2.861083984375, 3.4351806640625, 4.00927734375, 4.5833740234375, 5.157470703125, 5.7315673828125, 6.3056640625, 6.8797607421875, 7.453857421875, 8.0279541015625, 8.60205078125, 9.1761474609375, 9.750244140625, 10.3243408203125, 10.8984375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 9.0, 14.0, 13.0, 18.0, 42.0, 97.0, 133.0, 206.0, 184.0, 129.0, 69.0, 36.0, 16.0, 12.0, 8.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.5625, -6.41204833984375, -6.2615966796875, -6.11114501953125, -5.960693359375, -5.81024169921875, -5.6597900390625, -5.50933837890625, -5.35888671875, -5.20843505859375, -5.0579833984375, -4.90753173828125, -4.757080078125, -4.60662841796875, -4.4561767578125, -4.30572509765625, -4.1552734375, -4.00482177734375, -3.8543701171875, -3.70391845703125, -3.553466796875, -3.40301513671875, -3.2525634765625, -3.10211181640625, -2.95166015625, -2.80120849609375, -2.6507568359375, -2.50030517578125, -2.349853515625, -2.19940185546875, -2.0489501953125, -1.89849853515625, -1.748046875, -1.59759521484375, -1.4471435546875, -1.29669189453125, -1.146240234375, -0.99578857421875, -0.8453369140625, -0.69488525390625, -0.54443359375, -0.39398193359375, -0.2435302734375, -0.09307861328125, 0.057373046875, 0.20782470703125, 0.3582763671875, 0.50872802734375, 0.6591796875, 0.80963134765625, 0.9600830078125, 1.11053466796875, 1.260986328125, 1.41143798828125, 1.5618896484375, 1.71234130859375, 1.86279296875, 2.01324462890625, 2.1636962890625, 2.31414794921875, 2.464599609375, 2.61505126953125, 2.7655029296875, 2.91595458984375, 3.06640625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 6.0, 4.0, 13.0, 12.0, 17.0, 22.0, 35.0, 25.0, 25.0, 39.0, 67.0, 95.0, 101.0, 127.0, 171.0, 275.0, 404.0, 587.0, 910.0, 1547.0, 2523.0, 4651.0, 9694.0, 34678.0, 4063449.0, 50742.0, 11156.0, 5144.0, 2781.0, 1749.0, 1058.0, 633.0, 430.0, 339.0, 195.0, 128.0, 112.0, 87.0, 74.0, 51.0, 26.0, 24.0, 17.0, 18.0, 9.0, 10.0, 7.0, 6.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0], "bins": [-8.5234375, -8.2447509765625, -7.966064453125, -7.6873779296875, -7.40869140625, -7.1300048828125, -6.851318359375, -6.5726318359375, -6.2939453125, -6.0152587890625, -5.736572265625, -5.4578857421875, -5.17919921875, -4.9005126953125, -4.621826171875, -4.3431396484375, -4.064453125, -3.7857666015625, -3.507080078125, -3.2283935546875, -2.94970703125, -2.6710205078125, -2.392333984375, -2.1136474609375, -1.8349609375, -1.5562744140625, -1.277587890625, -0.9989013671875, -0.72021484375, -0.4415283203125, -0.162841796875, 0.1158447265625, 0.39453125, 0.6732177734375, 0.951904296875, 1.2305908203125, 1.50927734375, 1.7879638671875, 2.066650390625, 2.3453369140625, 2.6240234375, 2.9027099609375, 3.181396484375, 3.4600830078125, 3.73876953125, 4.0174560546875, 4.296142578125, 4.5748291015625, 4.853515625, 5.1322021484375, 5.410888671875, 5.6895751953125, 5.96826171875, 6.2469482421875, 6.525634765625, 6.8043212890625, 7.0830078125, 7.3616943359375, 7.640380859375, 7.9190673828125, 8.19775390625, 8.4764404296875, 8.755126953125, 9.0338134765625, 9.3125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 3.0, 6.0, 6.0, 10.0, 16.0, 34.0, 168.0, 3671.0, 68.0, 36.0, 15.0, 11.0, 3.0, 2.0, 3.0, 1.0, 3.0, 4.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.125, -4.96649169921875, -4.8079833984375, -4.64947509765625, -4.490966796875, -4.33245849609375, -4.1739501953125, -4.01544189453125, -3.85693359375, -3.69842529296875, -3.5399169921875, -3.38140869140625, -3.222900390625, -3.06439208984375, -2.9058837890625, -2.74737548828125, -2.5888671875, -2.43035888671875, -2.2718505859375, -2.11334228515625, -1.954833984375, -1.79632568359375, -1.6378173828125, -1.47930908203125, -1.32080078125, -1.16229248046875, -1.0037841796875, -0.84527587890625, -0.686767578125, -0.52825927734375, -0.3697509765625, -0.21124267578125, -0.052734375, 0.10577392578125, 0.2642822265625, 0.42279052734375, 0.581298828125, 0.73980712890625, 0.8983154296875, 1.05682373046875, 1.21533203125, 1.37384033203125, 1.5323486328125, 1.69085693359375, 1.849365234375, 2.00787353515625, 2.1663818359375, 2.32489013671875, 2.4833984375, 2.64190673828125, 2.8004150390625, 2.95892333984375, 3.117431640625, 3.27593994140625, 3.4344482421875, 3.59295654296875, 3.75146484375, 3.90997314453125, 4.0684814453125, 4.22698974609375, 4.385498046875, 4.54400634765625, 4.7025146484375, 4.86102294921875, 5.01953125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 7.0, 4.0, 2.0, 6.0, 3.0, 3.0, 7.0, 9.0, 6.0, 10.0, 12.0, 19.0, 17.0, 27.0, 35.0, 47.0, 64.0, 78.0, 91.0, 96.0, 74.0, 72.0, 63.0, 62.0, 40.0, 30.0, 18.0, 12.0, 13.0, 20.0, 15.0, 11.0, 10.0, 7.0, 4.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.592257499694824, -9.307798385620117, -9.023338317871094, -8.738879203796387, -8.454419136047363, -8.169960021972656, -7.885500431060791, -7.601040840148926, -7.3165812492370605, -7.032121658325195, -6.74766206741333, -6.463202476501465, -6.178743362426758, -5.894283294677734, -5.609824180603027, -5.325364589691162, -5.040904998779297, -4.756445407867432, -4.471985816955566, -4.187526226043701, -3.903066873550415, -3.61860728263855, -3.3341479301452637, -3.0496883392333984, -2.765228748321533, -2.480769157409668, -2.1963095664978027, -1.9118502140045166, -1.6273906230926514, -1.3429310321807861, -1.0584715604782104, -0.7740120887756348, -0.48955345153808594, -0.20509392023086548, 0.07936561107635498, 0.36382514238357544, 0.6482846736907959, 0.9327442646026611, 1.2172037363052368, 1.5016632080078125, 1.7861227989196777, 2.070582389831543, 2.355041980743408, 2.6395013332366943, 2.9239609241485596, 3.208420515060425, 3.492879867553711, 3.777339458465576, 4.061799049377441, 4.346258640289307, 4.630718231201172, 4.915177822113037, 5.199637413024902, 5.484096527099609, 5.768556118011475, 6.05301570892334, 6.337475299835205, 6.62193489074707, 6.9063944816589355, 7.190854072570801, 7.475313186645508, 7.759773254394531, 8.044232368469238, 8.328691482543945, 8.613151550292969]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 3.0, 4.0, 3.0, 9.0, 9.0, 16.0, 10.0, 15.0, 27.0, 19.0, 24.0, 36.0, 39.0, 27.0, 46.0, 49.0, 40.0, 53.0, 56.0, 51.0, 58.0, 61.0, 48.0, 49.0, 36.0, 41.0, 34.0, 28.0, 29.0, 16.0, 14.0, 14.0, 12.0, 7.0, 7.0, 5.0, 2.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.650160789489746, -7.321600437164307, -6.993040084838867, -6.664480209350586, -6.3359198570251465, -6.007359504699707, -5.678799629211426, -5.350239276885986, -5.021678924560547, -4.693118572235107, -4.364558219909668, -4.035998344421387, -3.7074379920959473, -3.378877639770508, -3.0503175258636475, -2.721757411956787, -2.3931970596313477, -2.064636707305908, -1.7360765933990479, -1.407516360282898, -1.078956127166748, -0.7503958940505981, -0.42183566093444824, -0.09327554702758789, 0.23528480529785156, 0.5638450384140015, 0.8924052715301514, 1.2209655046463013, 1.5495257377624512, 1.878085970878601, 2.206646203994751, 2.5352063179016113, 2.863767623901367, 3.1923279762268066, 3.520888090133667, 3.8494482040405273, 4.178008556365967, 4.506568908691406, 4.8351287841796875, 5.163689136505127, 5.492249488830566, 5.820809841156006, 6.149370193481445, 6.477930068969727, 6.806490421295166, 7.1350507736206055, 7.463610649108887, 7.792171001434326, 8.120731353759766, 8.449291229248047, 8.777852058410645, 9.106411933898926, 9.434972763061523, 9.763532638549805, 10.092092514038086, 10.420652389526367, 10.749213218688965, 11.077773094177246, 11.406333923339844, 11.734893798828125, 12.063453674316406, 12.392014503479004, 12.720574378967285, 13.049135208129883, 13.377695083618164]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 5.0, 5.0, 16.0, 20.0, 24.0, 37.0, 75.0, 100.0, 141.0, 275.0, 440.0, 945.0, 2310.0, 6237.0, 24865.0, 175979.0, 716032.0, 96516.0, 16356.0, 4628.0, 1752.0, 782.0, 407.0, 226.0, 136.0, 83.0, 43.0, 31.0, 17.0, 23.0, 15.0, 7.0, 7.0, 7.0, 7.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.671875, -8.3765869140625, -8.081298828125, -7.7860107421875, -7.49072265625, -7.1954345703125, -6.900146484375, -6.6048583984375, -6.3095703125, -6.0142822265625, -5.718994140625, -5.4237060546875, -5.12841796875, -4.8331298828125, -4.537841796875, -4.2425537109375, -3.947265625, -3.6519775390625, -3.356689453125, -3.0614013671875, -2.76611328125, -2.4708251953125, -2.175537109375, -1.8802490234375, -1.5849609375, -1.2896728515625, -0.994384765625, -0.6990966796875, -0.40380859375, -0.1085205078125, 0.186767578125, 0.4820556640625, 0.77734375, 1.0726318359375, 1.367919921875, 1.6632080078125, 1.95849609375, 2.2537841796875, 2.549072265625, 2.8443603515625, 3.1396484375, 3.4349365234375, 3.730224609375, 4.0255126953125, 4.32080078125, 4.6160888671875, 4.911376953125, 5.2066650390625, 5.501953125, 5.7972412109375, 6.092529296875, 6.3878173828125, 6.68310546875, 6.9783935546875, 7.273681640625, 7.5689697265625, 7.8642578125, 8.1595458984375, 8.454833984375, 8.7501220703125, 9.04541015625, 9.3406982421875, 9.635986328125, 9.9312744140625, 10.2265625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 5.0, 1.0, 8.0, 9.0, 19.0, 9.0, 38.0, 52.0, 60.0, 95.0, 111.0, 133.0, 118.0, 106.0, 86.0, 57.0, 34.0, 18.0, 16.0, 10.0, 8.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.56640625, -4.453765869140625, -4.34112548828125, -4.228485107421875, -4.1158447265625, -4.003204345703125, -3.89056396484375, -3.777923583984375, -3.665283203125, -3.552642822265625, -3.44000244140625, -3.327362060546875, -3.2147216796875, -3.102081298828125, -2.98944091796875, -2.876800537109375, -2.76416015625, -2.651519775390625, -2.53887939453125, -2.426239013671875, -2.3135986328125, -2.200958251953125, -2.08831787109375, -1.975677490234375, -1.863037109375, -1.750396728515625, -1.63775634765625, -1.525115966796875, -1.4124755859375, -1.299835205078125, -1.18719482421875, -1.074554443359375, -0.9619140625, -0.849273681640625, -0.73663330078125, -0.623992919921875, -0.5113525390625, -0.398712158203125, -0.28607177734375, -0.173431396484375, -0.060791015625, 0.051849365234375, 0.16448974609375, 0.277130126953125, 0.3897705078125, 0.502410888671875, 0.61505126953125, 0.727691650390625, 0.84033203125, 0.952972412109375, 1.06561279296875, 1.178253173828125, 1.2908935546875, 1.403533935546875, 1.51617431640625, 1.628814697265625, 1.741455078125, 1.854095458984375, 1.96673583984375, 2.079376220703125, 2.1920166015625, 2.304656982421875, 2.41729736328125, 2.529937744140625, 2.642578125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 4.0, 2.0, 3.0, 14.0, 14.0, 22.0, 57.0, 64.0, 112.0, 188.0, 425.0, 971.0, 2596.0, 9127.0, 51313.0, 663415.0, 284894.0, 26185.0, 5811.0, 1858.0, 727.0, 312.0, 171.0, 110.0, 59.0, 25.0, 19.0, 23.0, 9.0, 8.0, 2.0, 5.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.2265625, -6.935546875, -6.64453125, -6.353515625, -6.0625, -5.771484375, -5.48046875, -5.189453125, -4.8984375, -4.607421875, -4.31640625, -4.025390625, -3.734375, -3.443359375, -3.15234375, -2.861328125, -2.5703125, -2.279296875, -1.98828125, -1.697265625, -1.40625, -1.115234375, -0.82421875, -0.533203125, -0.2421875, 0.048828125, 0.33984375, 0.630859375, 0.921875, 1.212890625, 1.50390625, 1.794921875, 2.0859375, 2.376953125, 2.66796875, 2.958984375, 3.25, 3.541015625, 3.83203125, 4.123046875, 4.4140625, 4.705078125, 4.99609375, 5.287109375, 5.578125, 5.869140625, 6.16015625, 6.451171875, 6.7421875, 7.033203125, 7.32421875, 7.615234375, 7.90625, 8.197265625, 8.48828125, 8.779296875, 9.0703125, 9.361328125, 9.65234375, 9.943359375, 10.234375, 10.525390625, 10.81640625, 11.107421875, 11.3984375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 7.0, 3.0, 5.0, 8.0, 6.0, 6.0, 14.0, 12.0, 13.0, 20.0, 24.0, 23.0, 29.0, 39.0, 51.0, 39.0, 53.0, 50.0, 52.0, 52.0, 49.0, 49.0, 37.0, 53.0, 48.0, 41.0, 49.0, 39.0, 18.0, 19.0, 15.0, 20.0, 9.0, 10.0, 6.0, 11.0, 8.0, 3.0, 5.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.9140625, -7.65771484375, -7.4013671875, -7.14501953125, -6.888671875, -6.63232421875, -6.3759765625, -6.11962890625, -5.86328125, -5.60693359375, -5.3505859375, -5.09423828125, -4.837890625, -4.58154296875, -4.3251953125, -4.06884765625, -3.8125, -3.55615234375, -3.2998046875, -3.04345703125, -2.787109375, -2.53076171875, -2.2744140625, -2.01806640625, -1.76171875, -1.50537109375, -1.2490234375, -0.99267578125, -0.736328125, -0.47998046875, -0.2236328125, 0.03271484375, 0.2890625, 0.54541015625, 0.8017578125, 1.05810546875, 1.314453125, 1.57080078125, 1.8271484375, 2.08349609375, 2.33984375, 2.59619140625, 2.8525390625, 3.10888671875, 3.365234375, 3.62158203125, 3.8779296875, 4.13427734375, 4.390625, 4.64697265625, 4.9033203125, 5.15966796875, 5.416015625, 5.67236328125, 5.9287109375, 6.18505859375, 6.44140625, 6.69775390625, 6.9541015625, 7.21044921875, 7.466796875, 7.72314453125, 7.9794921875, 8.23583984375, 8.4921875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 6.0, 9.0, 6.0, 17.0, 38.0, 53.0, 113.0, 262.0, 679.0, 2848.0, 35391.0, 948779.0, 55400.0, 3633.0, 781.0, 257.0, 132.0, 65.0, 39.0, 19.0, 9.0, 7.0, 5.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.388671875, -3.215423583984375, -3.04217529296875, -2.868927001953125, -2.6956787109375, -2.522430419921875, -2.34918212890625, -2.175933837890625, -2.002685546875, -1.829437255859375, -1.65618896484375, -1.482940673828125, -1.3096923828125, -1.136444091796875, -0.96319580078125, -0.789947509765625, -0.61669921875, -0.443450927734375, -0.27020263671875, -0.096954345703125, 0.0762939453125, 0.249542236328125, 0.42279052734375, 0.596038818359375, 0.769287109375, 0.942535400390625, 1.11578369140625, 1.289031982421875, 1.4622802734375, 1.635528564453125, 1.80877685546875, 1.982025146484375, 2.1552734375, 2.328521728515625, 2.50177001953125, 2.675018310546875, 2.8482666015625, 3.021514892578125, 3.19476318359375, 3.368011474609375, 3.541259765625, 3.714508056640625, 3.88775634765625, 4.061004638671875, 4.2342529296875, 4.407501220703125, 4.58074951171875, 4.753997802734375, 4.92724609375, 5.100494384765625, 5.27374267578125, 5.446990966796875, 5.6202392578125, 5.793487548828125, 5.96673583984375, 6.139984130859375, 6.313232421875, 6.486480712890625, 6.65972900390625, 6.832977294921875, 7.0062255859375, 7.179473876953125, 7.35272216796875, 7.525970458984375, 7.69921875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 8.0, 5.0, 5.0, 10.0, 19.0, 27.0, 38.0, 72.0, 107.0, 168.0, 171.0, 153.0, 93.0, 50.0, 24.0, 25.0, 15.0, 11.0, 6.0, 5.0, 3.0, 2.0, 1.0], "bins": [-0.0009245872497558594, -0.0009065326303243637, -0.000888478010892868, -0.0008704233914613724, -0.0008523687720298767, -0.000834314152598381, -0.0008162595331668854, -0.0007982049137353897, -0.000780150294303894, -0.0007620956748723984, -0.0007440410554409027, -0.000725986436009407, -0.0007079318165779114, -0.0006898771971464157, -0.00067182257771492, -0.0006537679582834244, -0.0006357133388519287, -0.000617658719420433, -0.0005996040999889374, -0.0005815494805574417, -0.000563494861125946, -0.0005454402416944504, -0.0005273856222629547, -0.000509331002831459, -0.0004912763833999634, -0.0004732217639684677, -0.00045516714453697205, -0.0004371125251054764, -0.0004190579056739807, -0.00040100328624248505, -0.0003829486668109894, -0.0003648940473794937, -0.00034683942794799805, -0.0003287848085165024, -0.0003107301890850067, -0.00029267556965351105, -0.0002746209502220154, -0.0002565663307905197, -0.00023851171135902405, -0.00022045709192752838, -0.00020240247249603271, -0.00018434785306453705, -0.00016629323363304138, -0.00014823861420154572, -0.00013018399477005005, -0.00011212937533855438, -9.407475590705872e-05, -7.602013647556305e-05, -5.796551704406738e-05, -3.9910897612571716e-05, -2.185627818107605e-05, -3.8016587495803833e-06, 1.4252960681915283e-05, 3.230758011341095e-05, 5.0362199544906616e-05, 6.841681897640228e-05, 8.647143840789795e-05, 0.00010452605783939362, 0.00012258067727088928, 0.00014063529670238495, 0.00015868991613388062, 0.00017674453556537628, 0.00019479915499687195, 0.00021285377442836761, 0.00023090839385986328]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 4.0, 7.0, 5.0, 11.0, 13.0, 18.0, 49.0, 85.0, 151.0, 281.0, 660.0, 1852.0, 10784.0, 400015.0, 617954.0, 13158.0, 2134.0, 703.0, 286.0, 163.0, 88.0, 50.0, 32.0, 19.0, 13.0, 6.0, 3.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.26171875, -4.09808349609375, -3.9344482421875, -3.77081298828125, -3.607177734375, -3.44354248046875, -3.2799072265625, -3.11627197265625, -2.95263671875, -2.78900146484375, -2.6253662109375, -2.46173095703125, -2.298095703125, -2.13446044921875, -1.9708251953125, -1.80718994140625, -1.6435546875, -1.47991943359375, -1.3162841796875, -1.15264892578125, -0.989013671875, -0.82537841796875, -0.6617431640625, -0.49810791015625, -0.33447265625, -0.17083740234375, -0.0072021484375, 0.15643310546875, 0.320068359375, 0.48370361328125, 0.6473388671875, 0.81097412109375, 0.974609375, 1.13824462890625, 1.3018798828125, 1.46551513671875, 1.629150390625, 1.79278564453125, 1.9564208984375, 2.12005615234375, 2.28369140625, 2.44732666015625, 2.6109619140625, 2.77459716796875, 2.938232421875, 3.10186767578125, 3.2655029296875, 3.42913818359375, 3.5927734375, 3.75640869140625, 3.9200439453125, 4.08367919921875, 4.247314453125, 4.41094970703125, 4.5745849609375, 4.73822021484375, 4.90185546875, 5.06549072265625, 5.2291259765625, 5.39276123046875, 5.556396484375, 5.72003173828125, 5.8836669921875, 6.04730224609375, 6.2109375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 6.0, 11.0, 29.0, 44.0, 82.0, 143.0, 202.0, 192.0, 144.0, 70.0, 37.0, 20.0, 13.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.26171875, -4.08319091796875, -3.9046630859375, -3.72613525390625, -3.547607421875, -3.36907958984375, -3.1905517578125, -3.01202392578125, -2.83349609375, -2.65496826171875, -2.4764404296875, -2.29791259765625, -2.119384765625, -1.94085693359375, -1.7623291015625, -1.58380126953125, -1.4052734375, -1.22674560546875, -1.0482177734375, -0.86968994140625, -0.691162109375, -0.51263427734375, -0.3341064453125, -0.15557861328125, 0.02294921875, 0.20147705078125, 0.3800048828125, 0.55853271484375, 0.737060546875, 0.91558837890625, 1.0941162109375, 1.27264404296875, 1.451171875, 1.62969970703125, 1.8082275390625, 1.98675537109375, 2.165283203125, 2.34381103515625, 2.5223388671875, 2.70086669921875, 2.87939453125, 3.05792236328125, 3.2364501953125, 3.41497802734375, 3.593505859375, 3.77203369140625, 3.9505615234375, 4.12908935546875, 4.3076171875, 4.48614501953125, 4.6646728515625, 4.84320068359375, 5.021728515625, 5.20025634765625, 5.3787841796875, 5.55731201171875, 5.73583984375, 5.91436767578125, 6.0928955078125, 6.27142333984375, 6.449951171875, 6.62847900390625, 6.8070068359375, 6.98553466796875, 7.1640625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 6.0, 6.0, 19.0, 33.0, 92.0, 135.0, 223.0, 223.0, 137.0, 63.0, 30.0, 20.0, 13.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.38458251953125, -88.84367370605469, -86.30276489257812, -83.76185607910156, -81.220947265625, -78.68003845214844, -76.13912963867188, -73.59822082519531, -71.05731201171875, -68.51640319824219, -65.97549438476562, -63.43458557128906, -60.8936767578125, -58.35276794433594, -55.81186294555664, -53.27095413208008, -50.73004913330078, -48.18914031982422, -45.648231506347656, -43.107322692871094, -40.56641387939453, -38.02550506591797, -35.48460006713867, -32.94369125366211, -30.402782440185547, -27.861873626708984, -25.320964813232422, -22.780057907104492, -20.23914909362793, -17.698240280151367, -15.157332420349121, -12.616424560546875, -10.075515747070312, -7.534607410430908, -4.993699073791504, -2.4527907371520996, 0.08811759948730469, 2.629026412963867, 5.169934272766113, 7.710842132568359, 10.251750946044922, 12.792659759521484, 15.33356761932373, 17.874475479125977, 20.41538429260254, 22.9562931060791, 25.49720001220703, 28.038108825683594, 30.579017639160156, 33.11992645263672, 35.66083526611328, 38.201744079589844, 40.742652893066406, 43.28356170654297, 45.824466705322266, 48.36537551879883, 50.90628433227539, 53.44719314575195, 55.988101959228516, 58.52901077270508, 61.069915771484375, 63.61082458496094, 66.1517333984375, 68.69264221191406, 71.23355102539062]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 10.0, 9.0, 9.0, 13.0, 9.0, 19.0, 21.0, 29.0, 22.0, 47.0, 30.0, 42.0, 35.0, 41.0, 60.0, 46.0, 64.0, 50.0, 56.0, 48.0, 40.0, 40.0, 36.0, 36.0, 27.0, 26.0, 22.0, 24.0, 16.0, 10.0, 10.0, 8.0, 9.0, 9.0, 3.0, 4.0, 6.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-33.66944885253906, -32.45766830444336, -31.245887756347656, -30.034107208251953, -28.82232666015625, -27.610546112060547, -26.398767471313477, -25.186986923217773, -23.97520637512207, -22.763425827026367, -21.551645278930664, -20.33986473083496, -19.12808609008789, -17.916305541992188, -16.704524993896484, -15.492744445800781, -14.280963897705078, -13.069183349609375, -11.857402801513672, -10.645623207092285, -9.433842658996582, -8.222062110900879, -7.010282039642334, -5.798501968383789, -4.586721420288086, -3.374941110610962, -2.163160800933838, -0.9513804912567139, 0.26039981842041016, 1.4721803665161133, 2.683960437774658, 3.895740509033203, 5.107517242431641, 6.319297790527344, 7.531077861785889, 8.742857933044434, 9.954638481140137, 11.16641902923584, 12.378198623657227, 13.58997917175293, 14.801759719848633, 16.013540267944336, 17.22532081604004, 18.437101364135742, 19.648880004882812, 20.860660552978516, 22.07244110107422, 23.284221649169922, 24.496002197265625, 25.707782745361328, 26.91956329345703, 28.131343841552734, 29.343124389648438, 30.55490493774414, 31.76668357849121, 32.97846221923828, 34.19024658203125, 35.40202713012695, 36.613807678222656, 37.82558822631836, 39.03736877441406, 40.249149322509766, 41.46092987060547, 42.672706604003906, 43.88448715209961]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 4.0, 3.0, 3.0, 3.0, 8.0, 10.0, 8.0, 20.0, 25.0, 33.0, 52.0, 64.0, 108.0, 139.0, 211.0, 321.0, 476.0, 753.0, 1224.0, 2244.0, 3945.0, 7834.0, 17937.0, 54871.0, 661695.0, 3295261.0, 98078.0, 26706.0, 10828.0, 5038.0, 2603.0, 1479.0, 854.0, 525.0, 298.0, 221.0, 156.0, 74.0, 51.0, 53.0, 20.0, 14.0, 14.0, 8.0, 8.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.99609375, -3.871917724609375, -3.74774169921875, -3.623565673828125, -3.4993896484375, -3.375213623046875, -3.25103759765625, -3.126861572265625, -3.002685546875, -2.878509521484375, -2.75433349609375, -2.630157470703125, -2.5059814453125, -2.381805419921875, -2.25762939453125, -2.133453369140625, -2.00927734375, -1.885101318359375, -1.76092529296875, -1.636749267578125, -1.5125732421875, -1.388397216796875, -1.26422119140625, -1.140045166015625, -1.015869140625, -0.891693115234375, -0.76751708984375, -0.643341064453125, -0.5191650390625, -0.394989013671875, -0.27081298828125, -0.146636962890625, -0.0224609375, 0.101715087890625, 0.22589111328125, 0.350067138671875, 0.4742431640625, 0.598419189453125, 0.72259521484375, 0.846771240234375, 0.970947265625, 1.095123291015625, 1.21929931640625, 1.343475341796875, 1.4676513671875, 1.591827392578125, 1.71600341796875, 1.840179443359375, 1.96435546875, 2.088531494140625, 2.21270751953125, 2.336883544921875, 2.4610595703125, 2.585235595703125, 2.70941162109375, 2.833587646484375, 2.957763671875, 3.081939697265625, 3.20611572265625, 3.330291748046875, 3.4544677734375, 3.578643798828125, 3.70281982421875, 3.826995849609375, 3.951171875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 8.0, 6.0, 8.0, 9.0, 10.0, 13.0, 12.0, 23.0, 19.0, 36.0, 35.0, 46.0, 57.0, 70.0, 48.0, 80.0, 81.0, 68.0, 61.0, 65.0, 50.0, 39.0, 33.0, 22.0, 24.0, 15.0, 15.0, 17.0, 9.0, 10.0, 5.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.56640625, -1.510955810546875, -1.45550537109375, -1.400054931640625, -1.3446044921875, -1.289154052734375, -1.23370361328125, -1.178253173828125, -1.122802734375, -1.067352294921875, -1.01190185546875, -0.956451416015625, -0.9010009765625, -0.845550537109375, -0.79010009765625, -0.734649658203125, -0.67919921875, -0.623748779296875, -0.56829833984375, -0.512847900390625, -0.4573974609375, -0.401947021484375, -0.34649658203125, -0.291046142578125, -0.235595703125, -0.180145263671875, -0.12469482421875, -0.069244384765625, -0.0137939453125, 0.041656494140625, 0.09710693359375, 0.152557373046875, 0.2080078125, 0.263458251953125, 0.31890869140625, 0.374359130859375, 0.4298095703125, 0.485260009765625, 0.54071044921875, 0.596160888671875, 0.651611328125, 0.707061767578125, 0.76251220703125, 0.817962646484375, 0.8734130859375, 0.928863525390625, 0.98431396484375, 1.039764404296875, 1.09521484375, 1.150665283203125, 1.20611572265625, 1.261566162109375, 1.3170166015625, 1.372467041015625, 1.42791748046875, 1.483367919921875, 1.538818359375, 1.594268798828125, 1.64971923828125, 1.705169677734375, 1.7606201171875, 1.816070556640625, 1.87152099609375, 1.926971435546875, 1.982421875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 7.0, 14.0, 24.0, 63.0, 120.0, 335.0, 909.0, 3276.0, 15390.0, 135555.0, 3893901.0, 125258.0, 14817.0, 3184.0, 848.0, 307.0, 138.0, 58.0, 38.0, 24.0, 6.0, 5.0, 6.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-10.6953125, -10.4375, -10.1796875, -9.921875, -9.6640625, -9.40625, -9.1484375, -8.890625, -8.6328125, -8.375, -8.1171875, -7.859375, -7.6015625, -7.34375, -7.0859375, -6.828125, -6.5703125, -6.3125, -6.0546875, -5.796875, -5.5390625, -5.28125, -5.0234375, -4.765625, -4.5078125, -4.25, -3.9921875, -3.734375, -3.4765625, -3.21875, -2.9609375, -2.703125, -2.4453125, -2.1875, -1.9296875, -1.671875, -1.4140625, -1.15625, -0.8984375, -0.640625, -0.3828125, -0.125, 0.1328125, 0.390625, 0.6484375, 0.90625, 1.1640625, 1.421875, 1.6796875, 1.9375, 2.1953125, 2.453125, 2.7109375, 2.96875, 3.2265625, 3.484375, 3.7421875, 4.0, 4.2578125, 4.515625, 4.7734375, 5.03125, 5.2890625, 5.546875, 5.8046875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 6.0, 7.0, 6.0, 5.0, 16.0, 29.0, 46.0, 43.0, 89.0, 141.0, 359.0, 1616.0, 1054.0, 274.0, 136.0, 74.0, 54.0, 35.0, 20.0, 21.0, 18.0, 9.0, 10.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.97265625, -5.75836181640625, -5.5440673828125, -5.32977294921875, -5.115478515625, -4.90118408203125, -4.6868896484375, -4.47259521484375, -4.25830078125, -4.04400634765625, -3.8297119140625, -3.61541748046875, -3.401123046875, -3.18682861328125, -2.9725341796875, -2.75823974609375, -2.5439453125, -2.32965087890625, -2.1153564453125, -1.90106201171875, -1.686767578125, -1.47247314453125, -1.2581787109375, -1.04388427734375, -0.82958984375, -0.61529541015625, -0.4010009765625, -0.18670654296875, 0.027587890625, 0.24188232421875, 0.4561767578125, 0.67047119140625, 0.884765625, 1.09906005859375, 1.3133544921875, 1.52764892578125, 1.741943359375, 1.95623779296875, 2.1705322265625, 2.38482666015625, 2.59912109375, 2.81341552734375, 3.0277099609375, 3.24200439453125, 3.456298828125, 3.67059326171875, 3.8848876953125, 4.09918212890625, 4.3134765625, 4.52777099609375, 4.7420654296875, 4.95635986328125, 5.170654296875, 5.38494873046875, 5.5992431640625, 5.81353759765625, 6.02783203125, 6.24212646484375, 6.4564208984375, 6.67071533203125, 6.885009765625, 7.09930419921875, 7.3135986328125, 7.52789306640625, 7.7421875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 7.0, 3.0, 13.0, 30.0, 37.0, 65.0, 138.0, 219.0, 175.0, 119.0, 72.0, 50.0, 23.0, 14.0, 5.0, 11.0, 7.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-52.504051208496094, -51.117774963378906, -49.73149871826172, -48.34522247314453, -46.958946228027344, -45.572669982910156, -44.18639373779297, -42.80011749267578, -41.413841247558594, -40.027565002441406, -38.64128875732422, -37.25501251220703, -35.868736267089844, -34.482460021972656, -33.09618377685547, -31.70990753173828, -30.323633193969727, -28.93735694885254, -27.55108070373535, -26.164804458618164, -24.778528213500977, -23.39225196838379, -22.005977630615234, -20.619701385498047, -19.23342514038086, -17.847148895263672, -16.460872650146484, -15.074596405029297, -13.68832015991211, -12.302043914794922, -10.91576862335205, -9.529492378234863, -8.14321517944336, -6.756938934326172, -5.370662689208984, -3.984386920928955, -2.5981106758117676, -1.21183443069458, 0.17444133758544922, 1.5607175827026367, 2.946993827819824, 4.333270072937012, 5.719546318054199, 7.1058220863342285, 8.492097854614258, 9.878374099731445, 11.264650344848633, 12.65092658996582, 14.037202835083008, 15.423479080200195, 16.809755325317383, 18.19603157043457, 19.582307815551758, 20.968584060668945, 22.3548583984375, 23.741134643554688, 25.127410888671875, 26.513687133789062, 27.89996337890625, 29.286239624023438, 30.672515869140625, 32.05879211425781, 33.445068359375, 34.83134460449219, 36.217620849609375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 3.0, 4.0, 8.0, 7.0, 10.0, 18.0, 13.0, 23.0, 25.0, 28.0, 31.0, 26.0, 26.0, 49.0, 35.0, 39.0, 46.0, 50.0, 43.0, 57.0, 67.0, 28.0, 39.0, 36.0, 32.0, 31.0, 30.0, 26.0, 23.0, 24.0, 30.0, 12.0, 14.0, 14.0, 8.0, 9.0, 11.0, 6.0, 6.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-19.306528091430664, -18.70243263244629, -18.09833526611328, -17.494239807128906, -16.89014434814453, -16.286046981811523, -15.681951522827148, -15.077855110168457, -14.473758697509766, -13.869662284851074, -13.265565872192383, -12.661470413208008, -12.057374000549316, -11.453277587890625, -10.84918212890625, -10.245085716247559, -9.640989303588867, -9.036892890930176, -8.432796478271484, -7.828701019287109, -7.224604606628418, -6.620508193969727, -6.016412258148193, -5.41231632232666, -4.808219909667969, -4.204123497009277, -3.600027561187744, -2.995931386947632, -2.3918352127075195, -1.7877390384674072, -1.183642864227295, -0.5795469284057617, 0.0245513916015625, 0.6286475658416748, 1.232743740081787, 1.8368399143218994, 2.4409360885620117, 3.045032262802124, 3.6491284370422363, 4.2532243728637695, 4.857320785522461, 5.461417198181152, 6.0655131340026855, 6.669609069824219, 7.27370548248291, 7.877801895141602, 8.481897354125977, 9.085993766784668, 9.69009017944336, 10.29418659210205, 10.898283004760742, 11.502378463745117, 12.106474876403809, 12.7105712890625, 13.314666748046875, 13.918763160705566, 14.522859573364258, 15.12695598602295, 15.73105239868164, 16.335147857666016, 16.93924331665039, 17.5433406829834, 18.147436141967773, 18.75153350830078, 19.355628967285156]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 8.0, 10.0, 13.0, 34.0, 52.0, 64.0, 120.0, 220.0, 396.0, 707.0, 1402.0, 2823.0, 6877.0, 19235.0, 66128.0, 303369.0, 492676.0, 108556.0, 28667.0, 9642.0, 3800.0, 1733.0, 940.0, 463.0, 248.0, 147.0, 77.0, 57.0, 35.0, 16.0, 15.0, 9.0, 9.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.16015625, -5.0091552734375, -4.858154296875, -4.7071533203125, -4.55615234375, -4.4051513671875, -4.254150390625, -4.1031494140625, -3.9521484375, -3.8011474609375, -3.650146484375, -3.4991455078125, -3.34814453125, -3.1971435546875, -3.046142578125, -2.8951416015625, -2.744140625, -2.5931396484375, -2.442138671875, -2.2911376953125, -2.14013671875, -1.9891357421875, -1.838134765625, -1.6871337890625, -1.5361328125, -1.3851318359375, -1.234130859375, -1.0831298828125, -0.93212890625, -0.7811279296875, -0.630126953125, -0.4791259765625, -0.328125, -0.1771240234375, -0.026123046875, 0.1248779296875, 0.27587890625, 0.4268798828125, 0.577880859375, 0.7288818359375, 0.8798828125, 1.0308837890625, 1.181884765625, 1.3328857421875, 1.48388671875, 1.6348876953125, 1.785888671875, 1.9368896484375, 2.087890625, 2.2388916015625, 2.389892578125, 2.5408935546875, 2.69189453125, 2.8428955078125, 2.993896484375, 3.1448974609375, 3.2958984375, 3.4468994140625, 3.597900390625, 3.7489013671875, 3.89990234375, 4.0509033203125, 4.201904296875, 4.3529052734375, 4.50390625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 6.0, 8.0, 5.0, 11.0, 16.0, 33.0, 34.0, 44.0, 42.0, 49.0, 66.0, 63.0, 83.0, 74.0, 76.0, 67.0, 66.0, 48.0, 46.0, 32.0, 30.0, 29.0, 21.0, 20.0, 11.0, 4.0, 3.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.767578125, -1.709686279296875, -1.65179443359375, -1.593902587890625, -1.5360107421875, -1.478118896484375, -1.42022705078125, -1.362335205078125, -1.304443359375, -1.246551513671875, -1.18865966796875, -1.130767822265625, -1.0728759765625, -1.014984130859375, -0.95709228515625, -0.899200439453125, -0.84130859375, -0.783416748046875, -0.72552490234375, -0.667633056640625, -0.6097412109375, -0.551849365234375, -0.49395751953125, -0.436065673828125, -0.378173828125, -0.320281982421875, -0.26239013671875, -0.204498291015625, -0.1466064453125, -0.088714599609375, -0.03082275390625, 0.027069091796875, 0.0849609375, 0.142852783203125, 0.20074462890625, 0.258636474609375, 0.3165283203125, 0.374420166015625, 0.43231201171875, 0.490203857421875, 0.548095703125, 0.605987548828125, 0.66387939453125, 0.721771240234375, 0.7796630859375, 0.837554931640625, 0.89544677734375, 0.953338623046875, 1.01123046875, 1.069122314453125, 1.12701416015625, 1.184906005859375, 1.2427978515625, 1.300689697265625, 1.35858154296875, 1.416473388671875, 1.474365234375, 1.532257080078125, 1.59014892578125, 1.648040771484375, 1.7059326171875, 1.763824462890625, 1.82171630859375, 1.879608154296875, 1.9375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 2.0, 8.0, 15.0, 24.0, 26.0, 48.0, 56.0, 74.0, 134.0, 197.0, 401.0, 783.0, 1695.0, 4312.0, 15682.0, 103588.0, 765126.0, 130143.0, 17943.0, 4688.0, 1649.0, 839.0, 444.0, 228.0, 161.0, 96.0, 56.0, 43.0, 22.0, 19.0, 9.0, 10.0, 6.0, 5.0, 6.0, 5.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.5234375, -7.32305908203125, -7.1226806640625, -6.92230224609375, -6.721923828125, -6.52154541015625, -6.3211669921875, -6.12078857421875, -5.92041015625, -5.72003173828125, -5.5196533203125, -5.31927490234375, -5.118896484375, -4.91851806640625, -4.7181396484375, -4.51776123046875, -4.3173828125, -4.11700439453125, -3.9166259765625, -3.71624755859375, -3.515869140625, -3.31549072265625, -3.1151123046875, -2.91473388671875, -2.71435546875, -2.51397705078125, -2.3135986328125, -2.11322021484375, -1.912841796875, -1.71246337890625, -1.5120849609375, -1.31170654296875, -1.111328125, -0.91094970703125, -0.7105712890625, -0.51019287109375, -0.309814453125, -0.10943603515625, 0.0909423828125, 0.29132080078125, 0.49169921875, 0.69207763671875, 0.8924560546875, 1.09283447265625, 1.293212890625, 1.49359130859375, 1.6939697265625, 1.89434814453125, 2.0947265625, 2.29510498046875, 2.4954833984375, 2.69586181640625, 2.896240234375, 3.09661865234375, 3.2969970703125, 3.49737548828125, 3.69775390625, 3.89813232421875, 4.0985107421875, 4.29888916015625, 4.499267578125, 4.69964599609375, 4.9000244140625, 5.10040283203125, 5.30078125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 1.0, 4.0, 11.0, 5.0, 10.0, 11.0, 22.0, 26.0, 20.0, 33.0, 42.0, 39.0, 53.0, 53.0, 59.0, 61.0, 62.0, 62.0, 53.0, 62.0, 58.0, 52.0, 38.0, 28.0, 23.0, 23.0, 15.0, 21.0, 13.0, 6.0, 8.0, 5.0, 5.0, 5.0, 4.0, 1.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.359375, -7.14306640625, -6.9267578125, -6.71044921875, -6.494140625, -6.27783203125, -6.0615234375, -5.84521484375, -5.62890625, -5.41259765625, -5.1962890625, -4.97998046875, -4.763671875, -4.54736328125, -4.3310546875, -4.11474609375, -3.8984375, -3.68212890625, -3.4658203125, -3.24951171875, -3.033203125, -2.81689453125, -2.6005859375, -2.38427734375, -2.16796875, -1.95166015625, -1.7353515625, -1.51904296875, -1.302734375, -1.08642578125, -0.8701171875, -0.65380859375, -0.4375, -0.22119140625, -0.0048828125, 0.21142578125, 0.427734375, 0.64404296875, 0.8603515625, 1.07666015625, 1.29296875, 1.50927734375, 1.7255859375, 1.94189453125, 2.158203125, 2.37451171875, 2.5908203125, 2.80712890625, 3.0234375, 3.23974609375, 3.4560546875, 3.67236328125, 3.888671875, 4.10498046875, 4.3212890625, 4.53759765625, 4.75390625, 4.97021484375, 5.1865234375, 5.40283203125, 5.619140625, 5.83544921875, 6.0517578125, 6.26806640625, 6.484375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 9.0, 10.0, 22.0, 15.0, 52.0, 60.0, 148.0, 324.0, 804.0, 2624.0, 17437.0, 835336.0, 180916.0, 8089.0, 1628.0, 566.0, 241.0, 110.0, 58.0, 37.0, 25.0, 10.0, 8.0, 5.0, 2.0, 2.0, 5.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.078125, -5.90362548828125, -5.7291259765625, -5.55462646484375, -5.380126953125, -5.20562744140625, -5.0311279296875, -4.85662841796875, -4.68212890625, -4.50762939453125, -4.3331298828125, -4.15863037109375, -3.984130859375, -3.80963134765625, -3.6351318359375, -3.46063232421875, -3.2861328125, -3.11163330078125, -2.9371337890625, -2.76263427734375, -2.588134765625, -2.41363525390625, -2.2391357421875, -2.06463623046875, -1.89013671875, -1.71563720703125, -1.5411376953125, -1.36663818359375, -1.192138671875, -1.01763916015625, -0.8431396484375, -0.66864013671875, -0.494140625, -0.31964111328125, -0.1451416015625, 0.02935791015625, 0.203857421875, 0.37835693359375, 0.5528564453125, 0.72735595703125, 0.90185546875, 1.07635498046875, 1.2508544921875, 1.42535400390625, 1.599853515625, 1.77435302734375, 1.9488525390625, 2.12335205078125, 2.2978515625, 2.47235107421875, 2.6468505859375, 2.82135009765625, 2.995849609375, 3.17034912109375, 3.3448486328125, 3.51934814453125, 3.69384765625, 3.86834716796875, 4.0428466796875, 4.21734619140625, 4.391845703125, 4.56634521484375, 4.7408447265625, 4.91534423828125, 5.08984375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 6.0, 3.0, 9.0, 10.0, 22.0, 38.0, 48.0, 69.0, 126.0, 172.0, 194.0, 112.0, 58.0, 48.0, 25.0, 21.0, 9.0, 8.0, 8.0, 1.0, 6.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00043010711669921875, -0.00040959566831588745, -0.00038908421993255615, -0.00036857277154922485, -0.00034806132316589355, -0.00032754987478256226, -0.00030703842639923096, -0.00028652697801589966, -0.00026601552963256836, -0.00024550408124923706, -0.00022499263286590576, -0.00020448118448257446, -0.00018396973609924316, -0.00016345828771591187, -0.00014294683933258057, -0.00012243539094924927, -0.00010192394256591797, -8.141249418258667e-05, -6.090104579925537e-05, -4.038959741592407e-05, -1.9878149032592773e-05, 6.332993507385254e-07, 2.1144747734069824e-05, 4.165619611740112e-05, 6.216764450073242e-05, 8.267909288406372e-05, 0.00010319054126739502, 0.00012370198965072632, 0.00014421343803405762, 0.00016472488641738892, 0.00018523633480072021, 0.00020574778318405151, 0.0002262592315673828, 0.0002467706799507141, 0.0002672821283340454, 0.0002877935767173767, 0.000308305025100708, 0.0003288164734840393, 0.0003493279218673706, 0.0003698393702507019, 0.0003903508186340332, 0.0004108622670173645, 0.0004313737154006958, 0.0004518851637840271, 0.0004723966121673584, 0.0004929080605506897, 0.000513419508934021, 0.0005339309573173523, 0.0005544424057006836, 0.0005749538540840149, 0.0005954653024673462, 0.0006159767508506775, 0.0006364881992340088, 0.0006569996476173401, 0.0006775110960006714, 0.0006980225443840027, 0.000718533992767334, 0.0007390454411506653, 0.0007595568895339966, 0.0007800683379173279, 0.0008005797863006592, 0.0008210912346839905, 0.0008416026830673218, 0.0008621141314506531, 0.0008826255798339844]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 3.0, 5.0, 5.0, 5.0, 6.0, 4.0, 15.0, 11.0, 41.0, 42.0, 56.0, 104.0, 191.0, 383.0, 904.0, 2487.0, 10165.0, 125963.0, 858724.0, 40952.0, 5546.0, 1589.0, 615.0, 280.0, 170.0, 100.0, 62.0, 39.0, 29.0, 17.0, 15.0, 9.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-5.18359375, -5.055023193359375, -4.92645263671875, -4.797882080078125, -4.6693115234375, -4.540740966796875, -4.41217041015625, -4.283599853515625, -4.155029296875, -4.026458740234375, -3.89788818359375, -3.769317626953125, -3.6407470703125, -3.512176513671875, -3.38360595703125, -3.255035400390625, -3.12646484375, -2.997894287109375, -2.86932373046875, -2.740753173828125, -2.6121826171875, -2.483612060546875, -2.35504150390625, -2.226470947265625, -2.097900390625, -1.969329833984375, -1.84075927734375, -1.712188720703125, -1.5836181640625, -1.455047607421875, -1.32647705078125, -1.197906494140625, -1.0693359375, -0.940765380859375, -0.81219482421875, -0.683624267578125, -0.5550537109375, -0.426483154296875, -0.29791259765625, -0.169342041015625, -0.040771484375, 0.087799072265625, 0.21636962890625, 0.344940185546875, 0.4735107421875, 0.602081298828125, 0.73065185546875, 0.859222412109375, 0.98779296875, 1.116363525390625, 1.24493408203125, 1.373504638671875, 1.5020751953125, 1.630645751953125, 1.75921630859375, 1.887786865234375, 2.016357421875, 2.144927978515625, 2.27349853515625, 2.402069091796875, 2.5306396484375, 2.659210205078125, 2.78778076171875, 2.916351318359375, 3.044921875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 3.0, 4.0, 2.0, 2.0, 6.0, 9.0, 8.0, 14.0, 25.0, 24.0, 32.0, 29.0, 55.0, 63.0, 96.0, 114.0, 115.0, 90.0, 87.0, 48.0, 38.0, 26.0, 25.0, 25.0, 15.0, 11.0, 9.0, 7.0, 5.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.830078125, -3.7394866943359375, -3.648895263671875, -3.5583038330078125, -3.46771240234375, -3.3771209716796875, -3.286529541015625, -3.1959381103515625, -3.1053466796875, -3.0147552490234375, -2.924163818359375, -2.8335723876953125, -2.74298095703125, -2.6523895263671875, -2.561798095703125, -2.4712066650390625, -2.380615234375, -2.2900238037109375, -2.199432373046875, -2.1088409423828125, -2.01824951171875, -1.9276580810546875, -1.837066650390625, -1.7464752197265625, -1.6558837890625, -1.5652923583984375, -1.474700927734375, -1.3841094970703125, -1.29351806640625, -1.2029266357421875, -1.112335205078125, -1.0217437744140625, -0.93115234375, -0.8405609130859375, -0.749969482421875, -0.6593780517578125, -0.56878662109375, -0.4781951904296875, -0.387603759765625, -0.2970123291015625, -0.2064208984375, -0.1158294677734375, -0.025238037109375, 0.0653533935546875, 0.15594482421875, 0.2465362548828125, 0.337127685546875, 0.4277191162109375, 0.518310546875, 0.6089019775390625, 0.699493408203125, 0.7900848388671875, 0.88067626953125, 0.9712677001953125, 1.061859130859375, 1.1524505615234375, 1.2430419921875, 1.3336334228515625, 1.424224853515625, 1.5148162841796875, 1.60540771484375, 1.6959991455078125, 1.786590576171875, 1.8771820068359375, 1.9677734375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 8.0, 8.0, 10.0, 34.0, 64.0, 141.0, 268.0, 246.0, 126.0, 55.0, 20.0, 14.0, 8.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.88066101074219, -81.82772064208984, -79.77478790283203, -77.72184753417969, -75.66891479492188, -73.61597442626953, -71.56303405761719, -69.51010131835938, -67.45716094970703, -65.40422058105469, -63.351287841796875, -61.29834747314453, -59.24541091918945, -57.192474365234375, -55.13953399658203, -53.08659744262695, -51.033660888671875, -48.9807243347168, -46.92778778076172, -44.874847412109375, -42.8219108581543, -40.76897430419922, -38.716033935546875, -36.6630973815918, -34.61016082763672, -32.55722427368164, -30.50428581237793, -28.45134735107422, -26.39841079711914, -24.345474243164062, -22.29253578186035, -20.23959732055664, -18.18665313720703, -16.133716583251953, -14.080778121948242, -12.027840614318848, -9.974903106689453, -7.921965599060059, -5.869028091430664, -3.8160905838012695, -1.763153076171875, 0.28978443145751953, 2.342721939086914, 4.395659446716309, 6.448596954345703, 8.501534461975098, 10.554471969604492, 12.607409477233887, 14.660346984863281, 16.71328353881836, 18.76622200012207, 20.81916046142578, 22.87209701538086, 24.925033569335938, 26.97797203063965, 29.03091049194336, 31.083847045898438, 33.136783599853516, 35.189720153808594, 37.24266052246094, 39.295597076416016, 41.348533630371094, 43.40147399902344, 45.454410552978516, 47.507347106933594]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 6.0, 4.0, 10.0, 7.0, 10.0, 8.0, 30.0, 25.0, 24.0, 31.0, 38.0, 65.0, 62.0, 70.0, 79.0, 74.0, 66.0, 55.0, 58.0, 58.0, 49.0, 27.0, 30.0, 21.0, 24.0, 13.0, 16.0, 15.0, 5.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-40.44575500488281, -39.4511604309082, -38.456565856933594, -37.46196746826172, -36.46737289428711, -35.4727783203125, -34.47818374633789, -33.48358917236328, -32.488990783691406, -31.494396209716797, -30.499799728393555, -29.505205154418945, -28.510608673095703, -27.516014099121094, -26.521419525146484, -25.526824951171875, -24.532230377197266, -23.537635803222656, -22.543039321899414, -21.548444747924805, -20.553848266601562, -19.559253692626953, -18.564659118652344, -17.570064544677734, -16.575468063354492, -15.580872535705566, -14.58627700805664, -13.591682434082031, -12.597086906433105, -11.60249137878418, -10.60789680480957, -9.613301277160645, -8.618705749511719, -7.624110221862793, -6.629515171051025, -5.634920120239258, -4.640324592590332, -3.6457290649414062, -2.6511340141296387, -1.656538963317871, -0.6619434356689453, 0.33265185356140137, 1.327247142791748, 2.3218424320220947, 3.3164377212524414, 4.311033248901367, 5.305628299713135, 6.300223350524902, 7.294818878173828, 8.289414405822754, 9.28400993347168, 10.278604507446289, 11.273200035095215, 12.26779556274414, 13.26239013671875, 14.256985664367676, 15.251581192016602, 16.24617576599121, 17.240772247314453, 18.235366821289062, 19.229961395263672, 20.224557876586914, 21.219152450561523, 22.213748931884766, 23.208343505859375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 13.0, 4.0, 9.0, 15.0, 12.0, 17.0, 37.0, 37.0, 56.0, 84.0, 111.0, 157.0, 226.0, 293.0, 471.0, 732.0, 1260.0, 2121.0, 4267.0, 8944.0, 22696.0, 97100.0, 3234350.0, 730437.0, 58387.0, 17422.0, 7313.0, 3389.0, 1766.0, 927.0, 618.0, 343.0, 206.0, 139.0, 96.0, 68.0, 39.0, 28.0, 25.0, 16.0, 13.0, 7.0, 11.0, 3.0, 1.0, 2.0, 7.0, 1.0, 2.0], "bins": [-3.44140625, -3.350433349609375, -3.25946044921875, -3.168487548828125, -3.0775146484375, -2.986541748046875, -2.89556884765625, -2.804595947265625, -2.713623046875, -2.622650146484375, -2.53167724609375, -2.440704345703125, -2.3497314453125, -2.258758544921875, -2.16778564453125, -2.076812744140625, -1.98583984375, -1.894866943359375, -1.80389404296875, -1.712921142578125, -1.6219482421875, -1.530975341796875, -1.44000244140625, -1.349029541015625, -1.258056640625, -1.167083740234375, -1.07611083984375, -0.985137939453125, -0.8941650390625, -0.803192138671875, -0.71221923828125, -0.621246337890625, -0.5302734375, -0.439300537109375, -0.34832763671875, -0.257354736328125, -0.1663818359375, -0.075408935546875, 0.01556396484375, 0.106536865234375, 0.197509765625, 0.288482666015625, 0.37945556640625, 0.470428466796875, 0.5614013671875, 0.652374267578125, 0.74334716796875, 0.834320068359375, 0.92529296875, 1.016265869140625, 1.10723876953125, 1.198211669921875, 1.2891845703125, 1.380157470703125, 1.47113037109375, 1.562103271484375, 1.653076171875, 1.744049072265625, 1.83502197265625, 1.925994873046875, 2.0169677734375, 2.107940673828125, 2.19891357421875, 2.289886474609375, 2.380859375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 5.0, 10.0, 12.0, 16.0, 29.0, 54.0, 59.0, 82.0, 100.0, 95.0, 109.0, 114.0, 87.0, 59.0, 48.0, 41.0, 30.0, 20.0, 10.0, 7.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.326171875, -3.2507781982421875, -3.175384521484375, -3.0999908447265625, -3.02459716796875, -2.9492034912109375, -2.873809814453125, -2.7984161376953125, -2.7230224609375, -2.6476287841796875, -2.572235107421875, -2.4968414306640625, -2.42144775390625, -2.3460540771484375, -2.270660400390625, -2.1952667236328125, -2.119873046875, -2.0444793701171875, -1.969085693359375, -1.8936920166015625, -1.81829833984375, -1.7429046630859375, -1.667510986328125, -1.5921173095703125, -1.5167236328125, -1.4413299560546875, -1.365936279296875, -1.2905426025390625, -1.21514892578125, -1.1397552490234375, -1.064361572265625, -0.9889678955078125, -0.91357421875, -0.8381805419921875, -0.762786865234375, -0.6873931884765625, -0.61199951171875, -0.5366058349609375, -0.461212158203125, -0.3858184814453125, -0.3104248046875, -0.2350311279296875, -0.159637451171875, -0.0842437744140625, -0.00885009765625, 0.0665435791015625, 0.141937255859375, 0.2173309326171875, 0.292724609375, 0.3681182861328125, 0.443511962890625, 0.5189056396484375, 0.59429931640625, 0.6696929931640625, 0.745086669921875, 0.8204803466796875, 0.8958740234375, 0.9712677001953125, 1.046661376953125, 1.1220550537109375, 1.19744873046875, 1.2728424072265625, 1.348236083984375, 1.4236297607421875, 1.4990234375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 3.0, 5.0, 24.0, 26.0, 44.0, 62.0, 98.0, 161.0, 311.0, 590.0, 1159.0, 2337.0, 5161.0, 12445.0, 35346.0, 158156.0, 3372465.0, 510553.0, 63027.0, 18662.0, 7044.0, 3257.0, 1615.0, 761.0, 402.0, 240.0, 127.0, 80.0, 34.0, 32.0, 23.0, 10.0, 7.0, 4.0, 3.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.505859375, -3.401885986328125, -3.29791259765625, -3.193939208984375, -3.0899658203125, -2.985992431640625, -2.88201904296875, -2.778045654296875, -2.674072265625, -2.570098876953125, -2.46612548828125, -2.362152099609375, -2.2581787109375, -2.154205322265625, -2.05023193359375, -1.946258544921875, -1.84228515625, -1.738311767578125, -1.63433837890625, -1.530364990234375, -1.4263916015625, -1.322418212890625, -1.21844482421875, -1.114471435546875, -1.010498046875, -0.906524658203125, -0.80255126953125, -0.698577880859375, -0.5946044921875, -0.490631103515625, -0.38665771484375, -0.282684326171875, -0.1787109375, -0.074737548828125, 0.02923583984375, 0.133209228515625, 0.2371826171875, 0.341156005859375, 0.44512939453125, 0.549102783203125, 0.653076171875, 0.757049560546875, 0.86102294921875, 0.964996337890625, 1.0689697265625, 1.172943115234375, 1.27691650390625, 1.380889892578125, 1.48486328125, 1.588836669921875, 1.69281005859375, 1.796783447265625, 1.9007568359375, 2.004730224609375, 2.10870361328125, 2.212677001953125, 2.316650390625, 2.420623779296875, 2.52459716796875, 2.628570556640625, 2.7325439453125, 2.836517333984375, 2.94049072265625, 3.044464111328125, 3.1484375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 2.0, 4.0, 8.0, 8.0, 10.0, 8.0, 9.0, 17.0, 12.0, 28.0, 34.0, 36.0, 52.0, 57.0, 150.0, 263.0, 605.0, 1218.0, 702.0, 343.0, 148.0, 98.0, 61.0, 49.0, 30.0, 32.0, 22.0, 8.0, 10.0, 9.0, 4.0, 4.0, 6.0, 6.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.193359375, -3.095367431640625, -2.99737548828125, -2.899383544921875, -2.8013916015625, -2.703399658203125, -2.60540771484375, -2.507415771484375, -2.409423828125, -2.311431884765625, -2.21343994140625, -2.115447998046875, -2.0174560546875, -1.919464111328125, -1.82147216796875, -1.723480224609375, -1.62548828125, -1.527496337890625, -1.42950439453125, -1.331512451171875, -1.2335205078125, -1.135528564453125, -1.03753662109375, -0.939544677734375, -0.841552734375, -0.743560791015625, -0.64556884765625, -0.547576904296875, -0.4495849609375, -0.351593017578125, -0.25360107421875, -0.155609130859375, -0.0576171875, 0.040374755859375, 0.13836669921875, 0.236358642578125, 0.3343505859375, 0.432342529296875, 0.53033447265625, 0.628326416015625, 0.726318359375, 0.824310302734375, 0.92230224609375, 1.020294189453125, 1.1182861328125, 1.216278076171875, 1.31427001953125, 1.412261962890625, 1.51025390625, 1.608245849609375, 1.70623779296875, 1.804229736328125, 1.9022216796875, 2.000213623046875, 2.09820556640625, 2.196197509765625, 2.294189453125, 2.392181396484375, 2.49017333984375, 2.588165283203125, 2.6861572265625, 2.784149169921875, 2.88214111328125, 2.980133056640625, 3.078125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 4.0, 8.0, 12.0, 27.0, 61.0, 142.0, 248.0, 269.0, 122.0, 51.0, 22.0, 13.0, 9.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-45.43701934814453, -44.16937255859375, -42.901729583740234, -41.63408279418945, -40.36643981933594, -39.098793029785156, -37.831146240234375, -36.563499450683594, -35.29585647583008, -34.0282096862793, -32.76056671142578, -31.492919921875, -30.22527503967285, -28.957630157470703, -27.689983367919922, -26.422338485717773, -25.154693603515625, -23.887048721313477, -22.619403839111328, -21.351757049560547, -20.0841121673584, -18.81646728515625, -17.54882049560547, -16.28117561340332, -15.013530731201172, -13.745885848999023, -12.478240013122559, -11.210594177246094, -9.942949295043945, -8.675304412841797, -7.407658576965332, -6.140012741088867, -4.872364044189453, -3.6047186851501465, -2.33707332611084, -1.0694279670715332, 0.19821739196777344, 1.46586275100708, 2.7335081100463867, 4.001153945922852, 5.268798828125, 6.536444187164307, 7.804089546203613, 9.071735382080078, 10.339380264282227, 11.607025146484375, 12.87467098236084, 14.142316818237305, 15.409961700439453, 16.6776065826416, 17.94525146484375, 19.21289825439453, 20.48054313659668, 21.748188018798828, 23.01583480834961, 24.283479690551758, 25.551124572753906, 26.818769454956055, 28.086414337158203, 29.354061126708984, 30.621706008911133, 31.88935089111328, 33.15699768066406, 34.424644470214844, 35.69228744506836]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 2.0, 6.0, 12.0, 8.0, 14.0, 12.0, 12.0, 15.0, 18.0, 25.0, 15.0, 27.0, 33.0, 31.0, 28.0, 25.0, 32.0, 44.0, 49.0, 51.0, 39.0, 50.0, 44.0, 43.0, 34.0, 37.0, 29.0, 37.0, 37.0, 29.0, 17.0, 25.0, 10.0, 18.0, 17.0, 14.0, 8.0, 8.0, 5.0, 6.0, 7.0, 6.0, 6.0, 3.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-11.222179412841797, -10.851251602172852, -10.480324745178223, -10.109396934509277, -9.738469123840332, -9.367541313171387, -8.996614456176758, -8.625686645507812, -8.254758834838867, -7.88383150100708, -7.512903690338135, -7.141976356506348, -6.771048545837402, -6.400121212005615, -6.029193878173828, -5.658266067504883, -5.287338733673096, -4.916411399841309, -4.545483589172363, -4.174556255340576, -3.803628444671631, -3.4327011108398438, -3.0617735385894775, -2.6908459663391113, -2.319918394088745, -1.948990821838379, -1.5780632495880127, -1.207135796546936, -0.8362082242965698, -0.4652806520462036, -0.09435319900512695, 0.27657437324523926, 0.6475019454956055, 1.0184295177459717, 1.389357089996338, 1.7602845430374146, 2.1312122344970703, 2.5021395683288574, 2.8730671405792236, 3.24399471282959, 3.614922285079956, 3.9858498573303223, 4.356777191162109, 4.727705001831055, 5.098632335662842, 5.469560146331787, 5.840487480163574, 6.2114152908325195, 6.582342624664307, 6.953269958496094, 7.324197769165039, 7.695125102996826, 8.066052436828613, 8.436980247497559, 8.807908058166504, 9.178834915161133, 9.549762725830078, 9.920690536499023, 10.291617393493652, 10.662545204162598, 11.033473014831543, 11.404400825500488, 11.775327682495117, 12.146255493164062, 12.517183303833008]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 1.0, 7.0, 12.0, 11.0, 18.0, 32.0, 50.0, 51.0, 79.0, 120.0, 202.0, 270.0, 454.0, 690.0, 1187.0, 2099.0, 4123.0, 9196.0, 23504.0, 68653.0, 239542.0, 472439.0, 149015.0, 45895.0, 16540.0, 6794.0, 3165.0, 1706.0, 1022.0, 579.0, 344.0, 224.0, 155.0, 120.0, 71.0, 49.0, 38.0, 34.0, 19.0, 17.0, 9.0, 4.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-3.361328125, -3.25732421875, -3.1533203125, -3.04931640625, -2.9453125, -2.84130859375, -2.7373046875, -2.63330078125, -2.529296875, -2.42529296875, -2.3212890625, -2.21728515625, -2.11328125, -2.00927734375, -1.9052734375, -1.80126953125, -1.697265625, -1.59326171875, -1.4892578125, -1.38525390625, -1.28125, -1.17724609375, -1.0732421875, -0.96923828125, -0.865234375, -0.76123046875, -0.6572265625, -0.55322265625, -0.44921875, -0.34521484375, -0.2412109375, -0.13720703125, -0.033203125, 0.07080078125, 0.1748046875, 0.27880859375, 0.3828125, 0.48681640625, 0.5908203125, 0.69482421875, 0.798828125, 0.90283203125, 1.0068359375, 1.11083984375, 1.21484375, 1.31884765625, 1.4228515625, 1.52685546875, 1.630859375, 1.73486328125, 1.8388671875, 1.94287109375, 2.046875, 2.15087890625, 2.2548828125, 2.35888671875, 2.462890625, 2.56689453125, 2.6708984375, 2.77490234375, 2.87890625, 2.98291015625, 3.0869140625, 3.19091796875, 3.294921875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 9.0, 6.0, 8.0, 6.0, 11.0, 10.0, 31.0, 35.0, 30.0, 51.0, 56.0, 73.0, 75.0, 71.0, 75.0, 73.0, 75.0, 57.0, 49.0, 39.0, 37.0, 42.0, 28.0, 14.0, 20.0, 11.0, 7.0, 4.0, 2.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.990234375, -1.9340972900390625, -1.877960205078125, -1.8218231201171875, -1.76568603515625, -1.7095489501953125, -1.653411865234375, -1.5972747802734375, -1.5411376953125, -1.4850006103515625, -1.428863525390625, -1.3727264404296875, -1.31658935546875, -1.2604522705078125, -1.204315185546875, -1.1481781005859375, -1.092041015625, -1.0359039306640625, -0.979766845703125, -0.9236297607421875, -0.86749267578125, -0.8113555908203125, -0.755218505859375, -0.6990814208984375, -0.6429443359375, -0.5868072509765625, -0.530670166015625, -0.4745330810546875, -0.41839599609375, -0.3622589111328125, -0.306121826171875, -0.2499847412109375, -0.19384765625, -0.1377105712890625, -0.081573486328125, -0.0254364013671875, 0.03070068359375, 0.0868377685546875, 0.142974853515625, 0.1991119384765625, 0.2552490234375, 0.3113861083984375, 0.367523193359375, 0.4236602783203125, 0.47979736328125, 0.5359344482421875, 0.592071533203125, 0.6482086181640625, 0.704345703125, 0.7604827880859375, 0.816619873046875, 0.8727569580078125, 0.92889404296875, 0.9850311279296875, 1.041168212890625, 1.0973052978515625, 1.1534423828125, 1.2095794677734375, 1.265716552734375, 1.3218536376953125, 1.37799072265625, 1.4341278076171875, 1.490264892578125, 1.5464019775390625, 1.6025390625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 8.0, 9.0, 16.0, 24.0, 56.0, 71.0, 126.0, 227.0, 424.0, 963.0, 2951.0, 13287.0, 120502.0, 806950.0, 87760.0, 10877.0, 2563.0, 852.0, 417.0, 189.0, 105.0, 60.0, 36.0, 31.0, 13.0, 11.0, 6.0, 3.0, 7.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.88671875, -6.66766357421875, -6.4486083984375, -6.22955322265625, -6.010498046875, -5.79144287109375, -5.5723876953125, -5.35333251953125, -5.13427734375, -4.91522216796875, -4.6961669921875, -4.47711181640625, -4.258056640625, -4.03900146484375, -3.8199462890625, -3.60089111328125, -3.3818359375, -3.16278076171875, -2.9437255859375, -2.72467041015625, -2.505615234375, -2.28656005859375, -2.0675048828125, -1.84844970703125, -1.62939453125, -1.41033935546875, -1.1912841796875, -0.97222900390625, -0.753173828125, -0.53411865234375, -0.3150634765625, -0.09600830078125, 0.123046875, 0.34210205078125, 0.5611572265625, 0.78021240234375, 0.999267578125, 1.21832275390625, 1.4373779296875, 1.65643310546875, 1.87548828125, 2.09454345703125, 2.3135986328125, 2.53265380859375, 2.751708984375, 2.97076416015625, 3.1898193359375, 3.40887451171875, 3.6279296875, 3.84698486328125, 4.0660400390625, 4.28509521484375, 4.504150390625, 4.72320556640625, 4.9422607421875, 5.16131591796875, 5.38037109375, 5.59942626953125, 5.8184814453125, 6.03753662109375, 6.256591796875, 6.47564697265625, 6.6947021484375, 6.91375732421875, 7.1328125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 3.0, 1.0, 5.0, 8.0, 6.0, 5.0, 14.0, 9.0, 19.0, 25.0, 21.0, 26.0, 24.0, 30.0, 43.0, 42.0, 43.0, 45.0, 48.0, 63.0, 65.0, 41.0, 48.0, 41.0, 46.0, 31.0, 42.0, 42.0, 22.0, 23.0, 22.0, 20.0, 10.0, 13.0, 12.0, 11.0, 10.0, 5.0, 5.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.1171875, -3.97186279296875, -3.8265380859375, -3.68121337890625, -3.535888671875, -3.39056396484375, -3.2452392578125, -3.09991455078125, -2.95458984375, -2.80926513671875, -2.6639404296875, -2.51861572265625, -2.373291015625, -2.22796630859375, -2.0826416015625, -1.93731689453125, -1.7919921875, -1.64666748046875, -1.5013427734375, -1.35601806640625, -1.210693359375, -1.06536865234375, -0.9200439453125, -0.77471923828125, -0.62939453125, -0.48406982421875, -0.3387451171875, -0.19342041015625, -0.048095703125, 0.09722900390625, 0.2425537109375, 0.38787841796875, 0.533203125, 0.67852783203125, 0.8238525390625, 0.96917724609375, 1.114501953125, 1.25982666015625, 1.4051513671875, 1.55047607421875, 1.69580078125, 1.84112548828125, 1.9864501953125, 2.13177490234375, 2.277099609375, 2.42242431640625, 2.5677490234375, 2.71307373046875, 2.8583984375, 3.00372314453125, 3.1490478515625, 3.29437255859375, 3.439697265625, 3.58502197265625, 3.7303466796875, 3.87567138671875, 4.02099609375, 4.16632080078125, 4.3116455078125, 4.45697021484375, 4.602294921875, 4.74761962890625, 4.8929443359375, 5.03826904296875, 5.18359375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 2.0, 3.0, 6.0, 4.0, 9.0, 6.0, 11.0, 14.0, 22.0, 59.0, 116.0, 236.0, 546.0, 1882.0, 11894.0, 307544.0, 703347.0, 19082.0, 2533.0, 672.0, 262.0, 117.0, 75.0, 37.0, 32.0, 14.0, 8.0, 3.0, 10.0, 2.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.76171875, -3.660308837890625, -3.55889892578125, -3.457489013671875, -3.3560791015625, -3.254669189453125, -3.15325927734375, -3.051849365234375, -2.950439453125, -2.849029541015625, -2.74761962890625, -2.646209716796875, -2.5447998046875, -2.443389892578125, -2.34197998046875, -2.240570068359375, -2.13916015625, -2.037750244140625, -1.93634033203125, -1.834930419921875, -1.7335205078125, -1.632110595703125, -1.53070068359375, -1.429290771484375, -1.327880859375, -1.226470947265625, -1.12506103515625, -1.023651123046875, -0.9222412109375, -0.820831298828125, -0.71942138671875, -0.618011474609375, -0.5166015625, -0.415191650390625, -0.31378173828125, -0.212371826171875, -0.1109619140625, -0.009552001953125, 0.09185791015625, 0.193267822265625, 0.294677734375, 0.396087646484375, 0.49749755859375, 0.598907470703125, 0.7003173828125, 0.801727294921875, 0.90313720703125, 1.004547119140625, 1.10595703125, 1.207366943359375, 1.30877685546875, 1.410186767578125, 1.5115966796875, 1.613006591796875, 1.71441650390625, 1.815826416015625, 1.917236328125, 2.018646240234375, 2.12005615234375, 2.221466064453125, 2.3228759765625, 2.424285888671875, 2.52569580078125, 2.627105712890625, 2.728515625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 2.0, 6.0, 14.0, 10.0, 18.0, 36.0, 34.0, 47.0, 58.0, 78.0, 113.0, 118.0, 111.0, 95.0, 63.0, 62.0, 34.0, 34.0, 15.0, 13.0, 14.0, 11.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00027108192443847656, -0.0002601146697998047, -0.0002491474151611328, -0.00023818016052246094, -0.00022721290588378906, -0.0002162456512451172, -0.0002052783966064453, -0.00019431114196777344, -0.00018334388732910156, -0.0001723766326904297, -0.0001614093780517578, -0.00015044212341308594, -0.00013947486877441406, -0.0001285076141357422, -0.00011754035949707031, -0.00010657310485839844, -9.560585021972656e-05, -8.463859558105469e-05, -7.367134094238281e-05, -6.270408630371094e-05, -5.173683166503906e-05, -4.076957702636719e-05, -2.9802322387695312e-05, -1.8835067749023438e-05, -7.867813110351562e-06, 3.0994415283203125e-06, 1.4066696166992188e-05, 2.5033950805664062e-05, 3.600120544433594e-05, 4.696846008300781e-05, 5.793571472167969e-05, 6.890296936035156e-05, 7.987022399902344e-05, 9.083747863769531e-05, 0.00010180473327636719, 0.00011277198791503906, 0.00012373924255371094, 0.0001347064971923828, 0.0001456737518310547, 0.00015664100646972656, 0.00016760826110839844, 0.0001785755157470703, 0.0001895427703857422, 0.00020051002502441406, 0.00021147727966308594, 0.0002224445343017578, 0.0002334117889404297, 0.00024437904357910156, 0.00025534629821777344, 0.0002663135528564453, 0.0002772808074951172, 0.00028824806213378906, 0.00029921531677246094, 0.0003101825714111328, 0.0003211498260498047, 0.00033211708068847656, 0.00034308433532714844, 0.0003540515899658203, 0.0003650188446044922, 0.00037598609924316406, 0.00038695335388183594, 0.0003979206085205078, 0.0004088878631591797, 0.00041985511779785156, 0.00043082237243652344]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 8.0, 12.0, 12.0, 16.0, 31.0, 42.0, 67.0, 113.0, 173.0, 327.0, 613.0, 1368.0, 4021.0, 18452.0, 171825.0, 767641.0, 68746.0, 10161.0, 2721.0, 1061.0, 460.0, 270.0, 167.0, 87.0, 53.0, 26.0, 23.0, 16.0, 16.0, 7.0, 10.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8828125, -1.818603515625, -1.75439453125, -1.690185546875, -1.6259765625, -1.561767578125, -1.49755859375, -1.433349609375, -1.369140625, -1.304931640625, -1.24072265625, -1.176513671875, -1.1123046875, -1.048095703125, -0.98388671875, -0.919677734375, -0.85546875, -0.791259765625, -0.72705078125, -0.662841796875, -0.5986328125, -0.534423828125, -0.47021484375, -0.406005859375, -0.341796875, -0.277587890625, -0.21337890625, -0.149169921875, -0.0849609375, -0.020751953125, 0.04345703125, 0.107666015625, 0.171875, 0.236083984375, 0.30029296875, 0.364501953125, 0.4287109375, 0.492919921875, 0.55712890625, 0.621337890625, 0.685546875, 0.749755859375, 0.81396484375, 0.878173828125, 0.9423828125, 1.006591796875, 1.07080078125, 1.135009765625, 1.19921875, 1.263427734375, 1.32763671875, 1.391845703125, 1.4560546875, 1.520263671875, 1.58447265625, 1.648681640625, 1.712890625, 1.777099609375, 1.84130859375, 1.905517578125, 1.9697265625, 2.033935546875, 2.09814453125, 2.162353515625, 2.2265625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 3.0, 3.0, 8.0, 8.0, 3.0, 9.0, 16.0, 16.0, 30.0, 33.0, 40.0, 35.0, 61.0, 56.0, 76.0, 98.0, 78.0, 76.0, 68.0, 63.0, 39.0, 40.0, 35.0, 16.0, 20.0, 24.0, 11.0, 4.0, 7.0, 10.0, 6.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.9248046875, -1.8764495849609375, -1.828094482421875, -1.7797393798828125, -1.73138427734375, -1.6830291748046875, -1.634674072265625, -1.5863189697265625, -1.5379638671875, -1.4896087646484375, -1.441253662109375, -1.3928985595703125, -1.34454345703125, -1.2961883544921875, -1.247833251953125, -1.1994781494140625, -1.151123046875, -1.1027679443359375, -1.054412841796875, -1.0060577392578125, -0.95770263671875, -0.9093475341796875, -0.860992431640625, -0.8126373291015625, -0.7642822265625, -0.7159271240234375, -0.667572021484375, -0.6192169189453125, -0.57086181640625, -0.5225067138671875, -0.474151611328125, -0.4257965087890625, -0.37744140625, -0.3290863037109375, -0.280731201171875, -0.2323760986328125, -0.18402099609375, -0.1356658935546875, -0.087310791015625, -0.0389556884765625, 0.0093994140625, 0.0577545166015625, 0.106109619140625, 0.1544647216796875, 0.20281982421875, 0.2511749267578125, 0.299530029296875, 0.3478851318359375, 0.396240234375, 0.4445953369140625, 0.492950439453125, 0.5413055419921875, 0.58966064453125, 0.6380157470703125, 0.686370849609375, 0.7347259521484375, 0.7830810546875, 0.8314361572265625, 0.879791259765625, 0.9281463623046875, 0.97650146484375, 1.0248565673828125, 1.073211669921875, 1.1215667724609375, 1.169921875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 8.0, 14.0, 53.0, 131.0, 345.0, 291.0, 113.0, 30.0, 15.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.91323852539062, -71.73523712158203, -69.5572280883789, -67.37922668457031, -65.20121765136719, -63.023216247558594, -60.845211029052734, -58.667205810546875, -56.48920440673828, -54.31119918823242, -52.13319396972656, -49.95519256591797, -47.77718734741211, -45.59918212890625, -43.42117691040039, -41.24317169189453, -39.06516647338867, -36.88716125488281, -34.70915603637695, -32.531150817871094, -30.3531494140625, -28.17514419555664, -25.99713897705078, -23.819133758544922, -21.641130447387695, -19.463125228881836, -17.28512191772461, -15.10711669921875, -12.929112434387207, -10.751108169555664, -8.573102951049805, -6.395098686218262, -4.217094421386719, -2.0390899181365967, 0.1389145851135254, 2.3169193267822266, 4.4949235916137695, 6.6729278564453125, 8.850933074951172, 11.028937339782715, 13.206941604614258, 15.3849458694458, 17.562950134277344, 19.740955352783203, 21.918960571289062, 24.09696388244629, 26.27496910095215, 28.452972412109375, 30.630977630615234, 32.808982849121094, 34.98698806762695, 37.16499328613281, 39.342994689941406, 41.520999908447266, 43.699005126953125, 45.877010345458984, 48.055015563964844, 50.2330207824707, 52.41102600097656, 54.589027404785156, 56.767032623291016, 58.945037841796875, 61.123043060302734, 63.301048278808594, 65.47904968261719]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 6.0, 5.0, 8.0, 9.0, 10.0, 9.0, 15.0, 23.0, 22.0, 16.0, 31.0, 28.0, 31.0, 29.0, 41.0, 46.0, 62.0, 68.0, 69.0, 59.0, 64.0, 37.0, 30.0, 51.0, 36.0, 43.0, 31.0, 21.0, 21.0, 24.0, 15.0, 13.0, 7.0, 4.0, 5.0, 4.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.756563186645508, -21.063051223754883, -20.369537353515625, -19.676025390625, -18.982513427734375, -18.288999557495117, -17.595487594604492, -16.901973724365234, -16.20846176147461, -15.514948844909668, -14.821435928344727, -14.127923965454102, -13.43441104888916, -12.740898132324219, -12.047386169433594, -11.353873252868652, -10.660360336303711, -9.96684741973877, -9.273334503173828, -8.579822540283203, -7.886309623718262, -7.19279670715332, -6.499284267425537, -5.805771827697754, -5.1122589111328125, -4.418745994567871, -3.725233554840088, -3.0317208766937256, -2.3382081985473633, -1.644695520401001, -0.9511828422546387, -0.25767040252685547, 0.43584442138671875, 1.129357099533081, 1.8228697776794434, 2.5163824558258057, 3.209895133972168, 3.9034078121185303, 4.596920490264893, 5.290432929992676, 5.983945846557617, 6.677458763122559, 7.370971202850342, 8.064483642578125, 8.757996559143066, 9.451509475708008, 10.145021438598633, 10.838534355163574, 11.532047271728516, 12.225560188293457, 12.919073104858398, 13.612585067749023, 14.306097984313965, 14.999610900878906, 15.693122863769531, 16.386634826660156, 17.080148696899414, 17.77366065979004, 18.467174530029297, 19.160686492919922, 19.854198455810547, 20.547712326049805, 21.24122428894043, 21.934738159179688, 22.628250122070312]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 4.0, 3.0, 8.0, 15.0, 9.0, 20.0, 25.0, 32.0, 49.0, 76.0, 131.0, 250.0, 419.0, 823.0, 1640.0, 3729.0, 9186.0, 26044.0, 103478.0, 1071102.0, 2673471.0, 233502.0, 45767.0, 14388.0, 5687.0, 2334.0, 1089.0, 480.0, 258.0, 118.0, 77.0, 31.0, 14.0, 10.0, 8.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.62109375, -2.5604248046875, -2.499755859375, -2.4390869140625, -2.37841796875, -2.3177490234375, -2.257080078125, -2.1964111328125, -2.1357421875, -2.0750732421875, -2.014404296875, -1.9537353515625, -1.89306640625, -1.8323974609375, -1.771728515625, -1.7110595703125, -1.650390625, -1.5897216796875, -1.529052734375, -1.4683837890625, -1.40771484375, -1.3470458984375, -1.286376953125, -1.2257080078125, -1.1650390625, -1.1043701171875, -1.043701171875, -0.9830322265625, -0.92236328125, -0.8616943359375, -0.801025390625, -0.7403564453125, -0.6796875, -0.6190185546875, -0.558349609375, -0.4976806640625, -0.43701171875, -0.3763427734375, -0.315673828125, -0.2550048828125, -0.1943359375, -0.1336669921875, -0.072998046875, -0.0123291015625, 0.04833984375, 0.1090087890625, 0.169677734375, 0.2303466796875, 0.291015625, 0.3516845703125, 0.412353515625, 0.4730224609375, 0.53369140625, 0.5943603515625, 0.655029296875, 0.7156982421875, 0.7763671875, 0.8370361328125, 0.897705078125, 0.9583740234375, 1.01904296875, 1.0797119140625, 1.140380859375, 1.2010498046875, 1.26171875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 4.0, 10.0, 16.0, 16.0, 22.0, 34.0, 34.0, 63.0, 66.0, 67.0, 79.0, 75.0, 88.0, 84.0, 65.0, 78.0, 52.0, 41.0, 33.0, 23.0, 24.0, 18.0, 9.0, 7.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.6484375, -2.5921859741210938, -2.5359344482421875, -2.4796829223632812, -2.423431396484375, -2.3671798706054688, -2.3109283447265625, -2.2546768188476562, -2.19842529296875, -2.1421737670898438, -2.0859222412109375, -2.0296707153320312, -1.973419189453125, -1.9171676635742188, -1.8609161376953125, -1.8046646118164062, -1.7484130859375, -1.6921615600585938, -1.6359100341796875, -1.5796585083007812, -1.523406982421875, -1.4671554565429688, -1.4109039306640625, -1.3546524047851562, -1.29840087890625, -1.2421493530273438, -1.1858978271484375, -1.1296463012695312, -1.073394775390625, -1.0171432495117188, -0.9608917236328125, -0.9046401977539062, -0.848388671875, -0.7921371459960938, -0.7358856201171875, -0.6796340942382812, -0.623382568359375, -0.5671310424804688, -0.5108795166015625, -0.45462799072265625, -0.39837646484375, -0.34212493896484375, -0.2858734130859375, -0.22962188720703125, -0.173370361328125, -0.11711883544921875, -0.0608673095703125, -0.00461578369140625, 0.0516357421875, 0.10788726806640625, 0.1641387939453125, 0.22039031982421875, 0.276641845703125, 0.33289337158203125, 0.3891448974609375, 0.44539642333984375, 0.50164794921875, 0.5578994750976562, 0.6141510009765625, 0.6704025268554688, 0.726654052734375, 0.7829055786132812, 0.8391571044921875, 0.8954086303710938, 0.95166015625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 5.0, 5.0, 4.0, 12.0, 16.0, 13.0, 21.0, 44.0, 39.0, 96.0, 144.0, 251.0, 441.0, 953.0, 2061.0, 5204.0, 15182.0, 55558.0, 343458.0, 3334046.0, 344052.0, 61234.0, 18282.0, 6875.0, 2989.0, 1388.0, 763.0, 430.0, 246.0, 163.0, 98.0, 66.0, 39.0, 31.0, 22.0, 11.0, 10.0, 8.0, 7.0, 2.0, 4.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.662109375, -2.57757568359375, -2.4930419921875, -2.40850830078125, -2.323974609375, -2.23944091796875, -2.1549072265625, -2.07037353515625, -1.98583984375, -1.90130615234375, -1.8167724609375, -1.73223876953125, -1.647705078125, -1.56317138671875, -1.4786376953125, -1.39410400390625, -1.3095703125, -1.22503662109375, -1.1405029296875, -1.05596923828125, -0.971435546875, -0.88690185546875, -0.8023681640625, -0.71783447265625, -0.63330078125, -0.54876708984375, -0.4642333984375, -0.37969970703125, -0.295166015625, -0.21063232421875, -0.1260986328125, -0.04156494140625, 0.04296875, 0.12750244140625, 0.2120361328125, 0.29656982421875, 0.381103515625, 0.46563720703125, 0.5501708984375, 0.63470458984375, 0.71923828125, 0.80377197265625, 0.8883056640625, 0.97283935546875, 1.057373046875, 1.14190673828125, 1.2264404296875, 1.31097412109375, 1.3955078125, 1.48004150390625, 1.5645751953125, 1.64910888671875, 1.733642578125, 1.81817626953125, 1.9027099609375, 1.98724365234375, 2.07177734375, 2.15631103515625, 2.2408447265625, 2.32537841796875, 2.409912109375, 2.49444580078125, 2.5789794921875, 2.66351318359375, 2.748046875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 0.0, 8.0, 9.0, 6.0, 15.0, 9.0, 19.0, 19.0, 28.0, 45.0, 47.0, 74.0, 87.0, 172.0, 225.0, 412.0, 764.0, 744.0, 455.0, 256.0, 160.0, 105.0, 102.0, 74.0, 36.0, 40.0, 31.0, 23.0, 19.0, 14.0, 10.0, 16.0, 12.0, 6.0, 4.0, 2.0, 4.0, 3.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.169921875, -2.086669921875, -2.00341796875, -1.920166015625, -1.8369140625, -1.753662109375, -1.67041015625, -1.587158203125, -1.50390625, -1.420654296875, -1.33740234375, -1.254150390625, -1.1708984375, -1.087646484375, -1.00439453125, -0.921142578125, -0.837890625, -0.754638671875, -0.67138671875, -0.588134765625, -0.5048828125, -0.421630859375, -0.33837890625, -0.255126953125, -0.171875, -0.088623046875, -0.00537109375, 0.077880859375, 0.1611328125, 0.244384765625, 0.32763671875, 0.410888671875, 0.494140625, 0.577392578125, 0.66064453125, 0.743896484375, 0.8271484375, 0.910400390625, 0.99365234375, 1.076904296875, 1.16015625, 1.243408203125, 1.32666015625, 1.409912109375, 1.4931640625, 1.576416015625, 1.65966796875, 1.742919921875, 1.826171875, 1.909423828125, 1.99267578125, 2.075927734375, 2.1591796875, 2.242431640625, 2.32568359375, 2.408935546875, 2.4921875, 2.575439453125, 2.65869140625, 2.741943359375, 2.8251953125, 2.908447265625, 2.99169921875, 3.074951171875, 3.158203125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 6.0, 7.0, 43.0, 134.0, 329.0, 294.0, 107.0, 38.0, 11.0, 11.0, 8.0, 4.0, 5.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.229286193847656, -28.30753517150879, -26.385784149169922, -24.464035034179688, -22.542282104492188, -20.620532989501953, -18.698781967163086, -16.77703094482422, -14.855279922485352, -12.933528900146484, -11.011777877807617, -9.090027809143066, -7.168276786804199, -5.246525764465332, -3.3247756958007812, -1.403024673461914, 0.5187263488769531, 2.440477132797241, 4.362227916717529, 6.283978462219238, 8.205729484558105, 10.127480506896973, 12.049230575561523, 13.97098159790039, 15.892732620239258, 17.814483642578125, 19.736234664916992, 21.65798568725586, 23.579734802246094, 25.501487731933594, 27.423236846923828, 29.344987869262695, 31.266738891601562, 33.1884880065918, 35.1102409362793, 37.03199005126953, 38.95374298095703, 40.875492095947266, 42.7972412109375, 44.718994140625, 46.6407470703125, 48.562496185302734, 50.484249114990234, 52.40599822998047, 54.32775115966797, 56.2495002746582, 58.17124938964844, 60.09300231933594, 62.01475143432617, 63.936500549316406, 65.8582534790039, 67.7800064086914, 69.70175170898438, 71.62350463867188, 73.54525756835938, 75.46701049804688, 77.38875579833984, 79.31050872802734, 81.23225402832031, 83.15400695800781, 85.07575988769531, 86.99751281738281, 88.91925811767578, 90.84101104736328, 92.76276397705078]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 5.0, 9.0, 8.0, 9.0, 15.0, 15.0, 26.0, 33.0, 48.0, 34.0, 66.0, 61.0, 67.0, 54.0, 59.0, 62.0, 56.0, 61.0, 63.0, 46.0, 34.0, 27.0, 30.0, 22.0, 24.0, 17.0, 14.0, 11.0, 6.0, 4.0, 8.0, 3.0, 4.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.80950927734375, -16.142671585083008, -15.475834846496582, -14.808998107910156, -14.142160415649414, -13.475323677062988, -12.808486938476562, -12.14164924621582, -11.474812507629395, -10.807975769042969, -10.141138076782227, -9.4743013381958, -8.807464599609375, -8.140626907348633, -7.473790168762207, -6.806952953338623, -6.140115737915039, -5.473278522491455, -4.806441307067871, -4.139604568481445, -3.4727673530578613, -2.8059301376342773, -2.1390933990478516, -1.4722561836242676, -0.8054189682006836, -0.13858187198638916, 0.5282552242279053, 1.1950922012329102, 1.8619294166564941, 2.528766632080078, 3.195603370666504, 3.862440586090088, 4.529279708862305, 5.196116924285889, 5.862954139709473, 6.529790878295898, 7.196628093719482, 7.863465309143066, 8.530302047729492, 9.197139739990234, 9.86397647857666, 10.530813217163086, 11.197650909423828, 11.864487648010254, 12.53132438659668, 13.198162078857422, 13.864998817443848, 14.531835556030273, 15.198673248291016, 15.865509986877441, 16.532346725463867, 17.19918441772461, 17.86602210998535, 18.532859802246094, 19.199695587158203, 19.866533279418945, 20.533370971679688, 21.20020866394043, 21.86704444885254, 22.53388214111328, 23.200719833374023, 23.867557525634766, 24.534393310546875, 25.201231002807617, 25.868066787719727]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 8.0, 7.0, 6.0, 15.0, 14.0, 35.0, 43.0, 57.0, 78.0, 116.0, 175.0, 293.0, 441.0, 803.0, 1429.0, 2742.0, 5090.0, 10122.0, 21371.0, 46154.0, 103427.0, 244941.0, 338307.0, 148890.0, 64969.0, 29868.0, 14309.0, 6758.0, 3563.0, 1820.0, 1088.0, 607.0, 356.0, 218.0, 131.0, 108.0, 53.0, 45.0, 36.0, 17.0, 13.0, 14.0, 6.0, 5.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.30078125, -2.2293701171875, -2.157958984375, -2.0865478515625, -2.01513671875, -1.9437255859375, -1.872314453125, -1.8009033203125, -1.7294921875, -1.6580810546875, -1.586669921875, -1.5152587890625, -1.44384765625, -1.3724365234375, -1.301025390625, -1.2296142578125, -1.158203125, -1.0867919921875, -1.015380859375, -0.9439697265625, -0.87255859375, -0.8011474609375, -0.729736328125, -0.6583251953125, -0.5869140625, -0.5155029296875, -0.444091796875, -0.3726806640625, -0.30126953125, -0.2298583984375, -0.158447265625, -0.0870361328125, -0.015625, 0.0557861328125, 0.127197265625, 0.1986083984375, 0.27001953125, 0.3414306640625, 0.412841796875, 0.4842529296875, 0.5556640625, 0.6270751953125, 0.698486328125, 0.7698974609375, 0.84130859375, 0.9127197265625, 0.984130859375, 1.0555419921875, 1.126953125, 1.1983642578125, 1.269775390625, 1.3411865234375, 1.41259765625, 1.4840087890625, 1.555419921875, 1.6268310546875, 1.6982421875, 1.7696533203125, 1.841064453125, 1.9124755859375, 1.98388671875, 2.0552978515625, 2.126708984375, 2.1981201171875, 2.26953125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 2.0, 7.0, 5.0, 3.0, 8.0, 20.0, 8.0, 12.0, 15.0, 14.0, 22.0, 36.0, 30.0, 37.0, 29.0, 32.0, 33.0, 34.0, 40.0, 46.0, 47.0, 42.0, 51.0, 50.0, 36.0, 39.0, 42.0, 40.0, 21.0, 25.0, 30.0, 14.0, 16.0, 14.0, 17.0, 18.0, 11.0, 6.0, 12.0, 10.0, 5.0, 6.0, 4.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.9296875, -0.9017715454101562, -0.8738555908203125, -0.8459396362304688, -0.818023681640625, -0.7901077270507812, -0.7621917724609375, -0.7342758178710938, -0.70635986328125, -0.6784439086914062, -0.6505279541015625, -0.6226119995117188, -0.594696044921875, -0.5667800903320312, -0.5388641357421875, -0.5109481811523438, -0.4830322265625, -0.45511627197265625, -0.4272003173828125, -0.39928436279296875, -0.371368408203125, -0.34345245361328125, -0.3155364990234375, -0.28762054443359375, -0.25970458984375, -0.23178863525390625, -0.2038726806640625, -0.17595672607421875, -0.148040771484375, -0.12012481689453125, -0.0922088623046875, -0.06429290771484375, -0.036376953125, -0.00846099853515625, 0.0194549560546875, 0.04737091064453125, 0.075286865234375, 0.10320281982421875, 0.1311187744140625, 0.15903472900390625, 0.18695068359375, 0.21486663818359375, 0.2427825927734375, 0.27069854736328125, 0.298614501953125, 0.32653045654296875, 0.3544464111328125, 0.38236236572265625, 0.4102783203125, 0.43819427490234375, 0.4661102294921875, 0.49402618408203125, 0.521942138671875, 0.5498580932617188, 0.5777740478515625, 0.6056900024414062, 0.63360595703125, 0.6615219116210938, 0.6894378662109375, 0.7173538208007812, 0.745269775390625, 0.7731857299804688, 0.8011016845703125, 0.8290176391601562, 0.85693359375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 8.0, 6.0, 8.0, 10.0, 12.0, 17.0, 24.0, 31.0, 40.0, 53.0, 85.0, 125.0, 152.0, 206.0, 331.0, 528.0, 805.0, 1306.0, 2348.0, 4733.0, 12647.0, 48594.0, 259469.0, 593513.0, 89179.0, 20119.0, 6637.0, 3007.0, 1655.0, 974.0, 623.0, 408.0, 251.0, 187.0, 125.0, 98.0, 53.0, 52.0, 37.0, 33.0, 24.0, 11.0, 10.0, 5.0, 5.0, 8.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.537109375, -3.4237060546875, -3.310302734375, -3.1968994140625, -3.08349609375, -2.9700927734375, -2.856689453125, -2.7432861328125, -2.6298828125, -2.5164794921875, -2.403076171875, -2.2896728515625, -2.17626953125, -2.0628662109375, -1.949462890625, -1.8360595703125, -1.72265625, -1.6092529296875, -1.495849609375, -1.3824462890625, -1.26904296875, -1.1556396484375, -1.042236328125, -0.9288330078125, -0.8154296875, -0.7020263671875, -0.588623046875, -0.4752197265625, -0.36181640625, -0.2484130859375, -0.135009765625, -0.0216064453125, 0.091796875, 0.2052001953125, 0.318603515625, 0.4320068359375, 0.54541015625, 0.6588134765625, 0.772216796875, 0.8856201171875, 0.9990234375, 1.1124267578125, 1.225830078125, 1.3392333984375, 1.45263671875, 1.5660400390625, 1.679443359375, 1.7928466796875, 1.90625, 2.0196533203125, 2.133056640625, 2.2464599609375, 2.35986328125, 2.4732666015625, 2.586669921875, 2.7000732421875, 2.8134765625, 2.9268798828125, 3.040283203125, 3.1536865234375, 3.26708984375, 3.3804931640625, 3.493896484375, 3.6072998046875, 3.720703125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 6.0, 3.0, 9.0, 16.0, 7.0, 14.0, 17.0, 20.0, 29.0, 31.0, 38.0, 39.0, 47.0, 60.0, 48.0, 59.0, 60.0, 60.0, 64.0, 56.0, 42.0, 36.0, 33.0, 33.0, 30.0, 19.0, 27.0, 22.0, 20.0, 11.0, 10.0, 8.0, 10.0, 6.0, 6.0, 2.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.484375, -5.32757568359375, -5.1707763671875, -5.01397705078125, -4.857177734375, -4.70037841796875, -4.5435791015625, -4.38677978515625, -4.22998046875, -4.07318115234375, -3.9163818359375, -3.75958251953125, -3.602783203125, -3.44598388671875, -3.2891845703125, -3.13238525390625, -2.9755859375, -2.81878662109375, -2.6619873046875, -2.50518798828125, -2.348388671875, -2.19158935546875, -2.0347900390625, -1.87799072265625, -1.72119140625, -1.56439208984375, -1.4075927734375, -1.25079345703125, -1.093994140625, -0.93719482421875, -0.7803955078125, -0.62359619140625, -0.466796875, -0.30999755859375, -0.1531982421875, 0.00360107421875, 0.160400390625, 0.31719970703125, 0.4739990234375, 0.63079833984375, 0.78759765625, 0.94439697265625, 1.1011962890625, 1.25799560546875, 1.414794921875, 1.57159423828125, 1.7283935546875, 1.88519287109375, 2.0419921875, 2.19879150390625, 2.3555908203125, 2.51239013671875, 2.669189453125, 2.82598876953125, 2.9827880859375, 3.13958740234375, 3.29638671875, 3.45318603515625, 3.6099853515625, 3.76678466796875, 3.923583984375, 4.08038330078125, 4.2371826171875, 4.39398193359375, 4.55078125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 9.0, 14.0, 15.0, 41.0, 75.0, 166.0, 549.0, 2456.0, 32285.0, 958304.0, 50620.0, 3067.0, 581.0, 209.0, 95.0, 26.0, 22.0, 7.0, 3.0, 8.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.583984375, -2.482879638671875, -2.38177490234375, -2.280670166015625, -2.1795654296875, -2.078460693359375, -1.97735595703125, -1.876251220703125, -1.775146484375, -1.674041748046875, -1.57293701171875, -1.471832275390625, -1.3707275390625, -1.269622802734375, -1.16851806640625, -1.067413330078125, -0.96630859375, -0.865203857421875, -0.76409912109375, -0.662994384765625, -0.5618896484375, -0.460784912109375, -0.35968017578125, -0.258575439453125, -0.157470703125, -0.056365966796875, 0.04473876953125, 0.145843505859375, 0.2469482421875, 0.348052978515625, 0.44915771484375, 0.550262451171875, 0.6513671875, 0.752471923828125, 0.85357666015625, 0.954681396484375, 1.0557861328125, 1.156890869140625, 1.25799560546875, 1.359100341796875, 1.460205078125, 1.561309814453125, 1.66241455078125, 1.763519287109375, 1.8646240234375, 1.965728759765625, 2.06683349609375, 2.167938232421875, 2.26904296875, 2.370147705078125, 2.47125244140625, 2.572357177734375, 2.6734619140625, 2.774566650390625, 2.87567138671875, 2.976776123046875, 3.077880859375, 3.178985595703125, 3.28009033203125, 3.381195068359375, 3.4822998046875, 3.583404541015625, 3.68450927734375, 3.785614013671875, 3.88671875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 8.0, 6.0, 12.0, 24.0, 20.0, 34.0, 52.0, 72.0, 125.0, 163.0, 140.0, 103.0, 78.0, 54.0, 39.0, 24.0, 11.0, 9.0, 12.0, 6.0, 7.0, 1.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0006084442138671875, -0.0005939304828643799, -0.0005794167518615723, -0.0005649030208587646, -0.000550389289855957, -0.0005358755588531494, -0.0005213618278503418, -0.0005068480968475342, -0.0004923343658447266, -0.00047782063484191895, -0.00046330690383911133, -0.0004487931728363037, -0.0004342794418334961, -0.0004197657108306885, -0.00040525197982788086, -0.00039073824882507324, -0.0003762245178222656, -0.000361710786819458, -0.0003471970558166504, -0.0003326833248138428, -0.00031816959381103516, -0.00030365586280822754, -0.0002891421318054199, -0.0002746284008026123, -0.0002601146697998047, -0.00024560093879699707, -0.00023108720779418945, -0.00021657347679138184, -0.00020205974578857422, -0.0001875460147857666, -0.00017303228378295898, -0.00015851855278015137, -0.00014400482177734375, -0.00012949109077453613, -0.00011497735977172852, -0.0001004636287689209, -8.594989776611328e-05, -7.143616676330566e-05, -5.692243576049805e-05, -4.240870475769043e-05, -2.7894973754882812e-05, -1.3381242752075195e-05, 1.1324882507324219e-06, 1.564621925354004e-05, 3.0159950256347656e-05, 4.4673681259155273e-05, 5.918741226196289e-05, 7.370114326477051e-05, 8.821487426757812e-05, 0.00010272860527038574, 0.00011724233627319336, 0.00013175606727600098, 0.0001462697982788086, 0.0001607835292816162, 0.00017529726028442383, 0.00018981099128723145, 0.00020432472229003906, 0.00021883845329284668, 0.0002333521842956543, 0.0002478659152984619, 0.00026237964630126953, 0.00027689337730407715, 0.00029140710830688477, 0.0003059208393096924, 0.0003204345703125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 5.0, 5.0, 3.0, 7.0, 10.0, 18.0, 20.0, 21.0, 36.0, 57.0, 90.0, 121.0, 131.0, 220.0, 335.0, 543.0, 952.0, 1760.0, 3531.0, 8749.0, 27526.0, 140490.0, 669361.0, 148433.0, 29300.0, 8741.0, 3652.0, 1728.0, 997.0, 571.0, 344.0, 237.0, 148.0, 100.0, 78.0, 57.0, 48.0, 29.0, 26.0, 11.0, 21.0, 11.0, 7.0, 6.0, 10.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.97802734375, -0.9459762573242188, -0.9139251708984375, -0.8818740844726562, -0.849822998046875, -0.8177719116210938, -0.7857208251953125, -0.7536697387695312, -0.72161865234375, -0.6895675659179688, -0.6575164794921875, -0.6254653930664062, -0.593414306640625, -0.5613632202148438, -0.5293121337890625, -0.49726104736328125, -0.4652099609375, -0.43315887451171875, -0.4011077880859375, -0.36905670166015625, -0.337005615234375, -0.30495452880859375, -0.2729034423828125, -0.24085235595703125, -0.20880126953125, -0.17675018310546875, -0.1446990966796875, -0.11264801025390625, -0.080596923828125, -0.04854583740234375, -0.0164947509765625, 0.01555633544921875, 0.047607421875, 0.07965850830078125, 0.1117095947265625, 0.14376068115234375, 0.175811767578125, 0.20786285400390625, 0.2399139404296875, 0.27196502685546875, 0.30401611328125, 0.33606719970703125, 0.3681182861328125, 0.40016937255859375, 0.432220458984375, 0.46427154541015625, 0.4963226318359375, 0.5283737182617188, 0.5604248046875, 0.5924758911132812, 0.6245269775390625, 0.6565780639648438, 0.688629150390625, 0.7206802368164062, 0.7527313232421875, 0.7847824096679688, 0.81683349609375, 0.8488845825195312, 0.8809356689453125, 0.9129867553710938, 0.945037841796875, 0.9770889282226562, 1.0091400146484375, 1.0411911010742188, 1.0732421875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 5.0, 3.0, 6.0, 4.0, 8.0, 6.0, 8.0, 8.0, 12.0, 22.0, 18.0, 36.0, 30.0, 37.0, 42.0, 56.0, 54.0, 59.0, 63.0, 66.0, 71.0, 62.0, 46.0, 46.0, 31.0, 49.0, 29.0, 29.0, 30.0, 14.0, 16.0, 8.0, 3.0, 8.0, 4.0, 3.0, 7.0, 1.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0380859375, -1.0048675537109375, -0.971649169921875, -0.9384307861328125, -0.90521240234375, -0.8719940185546875, -0.838775634765625, -0.8055572509765625, -0.7723388671875, -0.7391204833984375, -0.705902099609375, -0.6726837158203125, -0.63946533203125, -0.6062469482421875, -0.573028564453125, -0.5398101806640625, -0.506591796875, -0.4733734130859375, -0.440155029296875, -0.4069366455078125, -0.37371826171875, -0.3404998779296875, -0.307281494140625, -0.2740631103515625, -0.2408447265625, -0.2076263427734375, -0.174407958984375, -0.1411895751953125, -0.10797119140625, -0.0747528076171875, -0.041534423828125, -0.0083160400390625, 0.02490234375, 0.0581207275390625, 0.091339111328125, 0.1245574951171875, 0.15777587890625, 0.1909942626953125, 0.224212646484375, 0.2574310302734375, 0.2906494140625, 0.3238677978515625, 0.357086181640625, 0.3903045654296875, 0.42352294921875, 0.4567413330078125, 0.489959716796875, 0.5231781005859375, 0.556396484375, 0.5896148681640625, 0.622833251953125, 0.6560516357421875, 0.68927001953125, 0.7224884033203125, 0.755706787109375, 0.7889251708984375, 0.8221435546875, 0.8553619384765625, 0.888580322265625, 0.9217987060546875, 0.95501708984375, 0.9882354736328125, 1.021453857421875, 1.0546722412109375, 1.087890625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 6.0, 7.0, 4.0, 16.0, 22.0, 35.0, 66.0, 89.0, 126.0, 248.0, 138.0, 94.0, 51.0, 41.0, 21.0, 9.0, 7.0, 5.0, 4.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.20698165893555, -35.37528610229492, -34.54359436035156, -33.71189880371094, -32.88020324707031, -32.04851150512695, -31.216815948486328, -30.385122299194336, -29.553428649902344, -28.72173500061035, -27.890039443969727, -27.058345794677734, -26.226652145385742, -25.39495849609375, -24.563262939453125, -23.731569290161133, -22.899873733520508, -22.068180084228516, -21.23648452758789, -20.4047908782959, -19.573097229003906, -18.74140167236328, -17.90970802307129, -17.078014373779297, -16.246318817138672, -15.414624214172363, -14.582930564880371, -13.751235961914062, -12.91954231262207, -12.087847709655762, -11.256153106689453, -10.424459457397461, -9.592767715454102, -8.761073112487793, -7.929379463195801, -7.097684860229492, -6.265990734100342, -5.434296607971191, -4.602602005004883, -3.7709078788757324, -2.939213752746582, -2.1075196266174316, -1.2758252620697021, -0.44413089752197266, 0.38756322860717773, 1.2192573547363281, 2.0509519577026367, 2.882646083831787, 3.7143402099609375, 4.546034336090088, 5.377728462219238, 6.209423065185547, 7.041117191314697, 7.872811317443848, 8.704505920410156, 9.536199569702148, 10.367894172668457, 11.199588775634766, 12.031282424926758, 12.862977027893066, 13.694671630859375, 14.526365280151367, 15.358059883117676, 16.189754486083984, 17.021448135375977]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 6.0, 11.0, 5.0, 6.0, 16.0, 12.0, 12.0, 18.0, 24.0, 28.0, 26.0, 18.0, 32.0, 38.0, 34.0, 48.0, 62.0, 73.0, 74.0, 73.0, 41.0, 33.0, 41.0, 45.0, 30.0, 33.0, 30.0, 17.0, 19.0, 17.0, 20.0, 10.0, 8.0, 10.0, 7.0, 8.0, 6.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.68695068359375, -16.132951736450195, -15.57895278930664, -15.02495288848877, -14.470953941345215, -13.91695499420166, -13.362955093383789, -12.808956146240234, -12.25495719909668, -11.700958251953125, -11.14695930480957, -10.5929594039917, -10.038960456848145, -9.48496150970459, -8.930961608886719, -8.376962661743164, -7.822963714599609, -7.268964767456055, -6.714965343475342, -6.160965919494629, -5.606966972351074, -5.0529680252075195, -4.498968601226807, -3.944969415664673, -3.390970230102539, -2.8369710445404053, -2.2829718589782715, -1.7289726734161377, -1.174973487854004, -0.6209743022918701, -0.06697511672973633, 0.48702406883239746, 1.0410232543945312, 1.595022439956665, 2.149021625518799, 2.7030208110809326, 3.2570199966430664, 3.8110191822052, 4.365018367767334, 4.919017791748047, 5.473016738891602, 6.027015686035156, 6.581015110015869, 7.135014533996582, 7.689013481140137, 8.243012428283691, 8.797012329101562, 9.351011276245117, 9.905010223388672, 10.459009170532227, 11.013008117675781, 11.567008018493652, 12.121006965637207, 12.675005912780762, 13.229005813598633, 13.783004760742188, 14.337003707885742, 14.891002655029297, 15.445001602172852, 15.999001502990723, 16.553001403808594, 17.10700035095215, 17.660999298095703, 18.214998245239258, 18.768997192382812]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 4.0, 4.0, 10.0, 13.0, 17.0, 39.0, 53.0, 70.0, 108.0, 183.0, 309.0, 557.0, 986.0, 1872.0, 3613.0, 7145.0, 15603.0, 39884.0, 145500.0, 955857.0, 2497802.0, 398509.0, 77882.0, 26307.0, 11134.0, 5103.0, 2590.0, 1338.0, 759.0, 417.0, 217.0, 154.0, 95.0, 60.0, 21.0, 21.0, 18.0, 9.0, 11.0, 8.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.5, -1.4586639404296875, -1.417327880859375, -1.3759918212890625, -1.33465576171875, -1.2933197021484375, -1.251983642578125, -1.2106475830078125, -1.1693115234375, -1.1279754638671875, -1.086639404296875, -1.0453033447265625, -1.00396728515625, -0.9626312255859375, -0.921295166015625, -0.8799591064453125, -0.838623046875, -0.7972869873046875, -0.755950927734375, -0.7146148681640625, -0.67327880859375, -0.6319427490234375, -0.590606689453125, -0.5492706298828125, -0.5079345703125, -0.4665985107421875, -0.425262451171875, -0.3839263916015625, -0.34259033203125, -0.3012542724609375, -0.259918212890625, -0.2185821533203125, -0.17724609375, -0.1359100341796875, -0.094573974609375, -0.0532379150390625, -0.01190185546875, 0.0294342041015625, 0.070770263671875, 0.1121063232421875, 0.1534423828125, 0.1947784423828125, 0.236114501953125, 0.2774505615234375, 0.31878662109375, 0.3601226806640625, 0.401458740234375, 0.4427947998046875, 0.484130859375, 0.5254669189453125, 0.566802978515625, 0.6081390380859375, 0.64947509765625, 0.6908111572265625, 0.732147216796875, 0.7734832763671875, 0.8148193359375, 0.8561553955078125, 0.897491455078125, 0.9388275146484375, 0.98016357421875, 1.0214996337890625, 1.062835693359375, 1.1041717529296875, 1.1455078125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 7.0, 4.0, 5.0, 11.0, 11.0, 13.0, 17.0, 12.0, 9.0, 26.0, 23.0, 24.0, 36.0, 35.0, 39.0, 42.0, 39.0, 39.0, 43.0, 47.0, 43.0, 49.0, 30.0, 55.0, 36.0, 48.0, 34.0, 29.0, 23.0, 26.0, 22.0, 15.0, 23.0, 16.0, 13.0, 7.0, 10.0, 3.0, 11.0, 10.0, 7.0, 6.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8193359375, -0.791656494140625, -0.76397705078125, -0.736297607421875, -0.7086181640625, -0.680938720703125, -0.65325927734375, -0.625579833984375, -0.597900390625, -0.570220947265625, -0.54254150390625, -0.514862060546875, -0.4871826171875, -0.459503173828125, -0.43182373046875, -0.404144287109375, -0.37646484375, -0.348785400390625, -0.32110595703125, -0.293426513671875, -0.2657470703125, -0.238067626953125, -0.21038818359375, -0.182708740234375, -0.155029296875, -0.127349853515625, -0.09967041015625, -0.071990966796875, -0.0443115234375, -0.016632080078125, 0.01104736328125, 0.038726806640625, 0.06640625, 0.094085693359375, 0.12176513671875, 0.149444580078125, 0.1771240234375, 0.204803466796875, 0.23248291015625, 0.260162353515625, 0.287841796875, 0.315521240234375, 0.34320068359375, 0.370880126953125, 0.3985595703125, 0.426239013671875, 0.45391845703125, 0.481597900390625, 0.50927734375, 0.536956787109375, 0.56463623046875, 0.592315673828125, 0.6199951171875, 0.647674560546875, 0.67535400390625, 0.703033447265625, 0.730712890625, 0.758392333984375, 0.78607177734375, 0.813751220703125, 0.8414306640625, 0.869110107421875, 0.89678955078125, 0.924468994140625, 0.9521484375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 7.0, 5.0, 10.0, 15.0, 10.0, 19.0, 30.0, 52.0, 69.0, 99.0, 126.0, 214.0, 403.0, 730.0, 1248.0, 2516.0, 5627.0, 14633.0, 46800.0, 213970.0, 2914582.0, 848451.0, 101392.0, 26944.0, 8954.0, 3493.0, 1684.0, 871.0, 497.0, 292.0, 181.0, 118.0, 67.0, 54.0, 35.0, 24.0, 22.0, 14.0, 6.0, 4.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 5.0, 0.0, 3.0, 1.0], "bins": [-2.115234375, -2.054412841796875, -1.99359130859375, -1.932769775390625, -1.8719482421875, -1.811126708984375, -1.75030517578125, -1.689483642578125, -1.628662109375, -1.567840576171875, -1.50701904296875, -1.446197509765625, -1.3853759765625, -1.324554443359375, -1.26373291015625, -1.202911376953125, -1.14208984375, -1.081268310546875, -1.02044677734375, -0.959625244140625, -0.8988037109375, -0.837982177734375, -0.77716064453125, -0.716339111328125, -0.655517578125, -0.594696044921875, -0.53387451171875, -0.473052978515625, -0.4122314453125, -0.351409912109375, -0.29058837890625, -0.229766845703125, -0.1689453125, -0.108123779296875, -0.04730224609375, 0.013519287109375, 0.0743408203125, 0.135162353515625, 0.19598388671875, 0.256805419921875, 0.317626953125, 0.378448486328125, 0.43927001953125, 0.500091552734375, 0.5609130859375, 0.621734619140625, 0.68255615234375, 0.743377685546875, 0.80419921875, 0.865020751953125, 0.92584228515625, 0.986663818359375, 1.0474853515625, 1.108306884765625, 1.16912841796875, 1.229949951171875, 1.290771484375, 1.351593017578125, 1.41241455078125, 1.473236083984375, 1.5340576171875, 1.594879150390625, 1.65570068359375, 1.716522216796875, 1.77734375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 12.0, 5.0, 8.0, 8.0, 19.0, 15.0, 36.0, 44.0, 65.0, 91.0, 167.0, 313.0, 598.0, 1049.0, 732.0, 345.0, 190.0, 143.0, 65.0, 37.0, 42.0, 23.0, 22.0, 17.0, 11.0, 9.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0], "bins": [-3.689453125, -3.596405029296875, -3.50335693359375, -3.410308837890625, -3.3172607421875, -3.224212646484375, -3.13116455078125, -3.038116455078125, -2.945068359375, -2.852020263671875, -2.75897216796875, -2.665924072265625, -2.5728759765625, -2.479827880859375, -2.38677978515625, -2.293731689453125, -2.20068359375, -2.107635498046875, -2.01458740234375, -1.921539306640625, -1.8284912109375, -1.735443115234375, -1.64239501953125, -1.549346923828125, -1.456298828125, -1.363250732421875, -1.27020263671875, -1.177154541015625, -1.0841064453125, -0.991058349609375, -0.89801025390625, -0.804962158203125, -0.7119140625, -0.618865966796875, -0.52581787109375, -0.432769775390625, -0.3397216796875, -0.246673583984375, -0.15362548828125, -0.060577392578125, 0.032470703125, 0.125518798828125, 0.21856689453125, 0.311614990234375, 0.4046630859375, 0.497711181640625, 0.59075927734375, 0.683807373046875, 0.77685546875, 0.869903564453125, 0.96295166015625, 1.055999755859375, 1.1490478515625, 1.242095947265625, 1.33514404296875, 1.428192138671875, 1.521240234375, 1.614288330078125, 1.70733642578125, 1.800384521484375, 1.8934326171875, 1.986480712890625, 2.07952880859375, 2.172576904296875, 2.265625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 17.0, 61.0, 367.0, 435.0, 87.0, 15.0, 7.0, 6.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.178726196289062, -24.17584800720215, -22.172969818115234, -20.170089721679688, -18.167211532592773, -16.16433334350586, -14.161454200744629, -12.158575057983398, -10.155696868896484, -8.15281867980957, -6.14993953704834, -4.147060871124268, -2.1441822052001953, -0.14130401611328125, 1.8615751266479492, 3.8644542694091797, 5.867332458496094, 7.870211124420166, 9.873089790344238, 11.875968933105469, 13.878847122192383, 15.881725311279297, 17.884605407714844, 19.887483596801758, 21.890361785888672, 23.893239974975586, 25.8961181640625, 27.898998260498047, 29.90187644958496, 31.904754638671875, 33.90763473510742, 35.91051483154297, 37.91338348388672, 39.916263580322266, 41.91913986206055, 43.922019958496094, 45.924896240234375, 47.92777633666992, 49.93065643310547, 51.93353271484375, 53.9364128112793, 55.939292907714844, 57.942169189453125, 59.94504928588867, 61.94792938232422, 63.9508056640625, 65.95368194580078, 67.9565658569336, 69.95944213867188, 71.96231842041016, 73.96520233154297, 75.96807861328125, 77.97095489501953, 79.97383117675781, 81.97671508789062, 83.9795913696289, 85.98246765136719, 87.98534393310547, 89.98822784423828, 91.99110412597656, 93.99398040771484, 95.99685668945312, 97.99974060058594, 100.00261688232422, 102.00550079345703]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 10.0, 11.0, 16.0, 16.0, 28.0, 25.0, 36.0, 42.0, 37.0, 55.0, 44.0, 58.0, 62.0, 72.0, 78.0, 58.0, 50.0, 55.0, 48.0, 35.0, 37.0, 23.0, 26.0, 20.0, 10.0, 10.0, 7.0, 9.0, 2.0, 6.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.574365615844727, -12.098608016967773, -11.622849464416504, -11.14709186553955, -10.671334266662598, -10.195575714111328, -9.719818115234375, -9.244060516357422, -8.768301963806152, -8.2925443649292, -7.816786289215088, -7.341028213500977, -6.865270137786865, -6.389512062072754, -5.913754463195801, -5.4379963874816895, -4.962238788604736, -4.486480712890625, -4.010723114013672, -3.5349650382995605, -3.059206962585449, -2.583449125289917, -2.1076912879943848, -1.6319332122802734, -1.1561753749847412, -0.6804174184799194, -0.20465952157974243, 0.27109837532043457, 0.7468563318252563, 1.2226142883300781, 1.6983721256256104, 2.1741302013397217, 2.649888038635254, 3.125645875930786, 3.6014039516448975, 4.07716178894043, 4.552919864654541, 5.028677940368652, 5.5044355392456055, 5.980193614959717, 6.455951690673828, 6.9317097663879395, 7.407467365264893, 7.883225440979004, 8.358983039855957, 8.834741592407227, 9.31049919128418, 9.786256790161133, 10.262014389038086, 10.737771987915039, 11.213530540466309, 11.689288139343262, 12.165045738220215, 12.640804290771484, 13.116561889648438, 13.59231948852539, 14.06807804107666, 14.543835639953613, 15.019594192504883, 15.495351791381836, 15.971109390258789, 16.446866989135742, 16.922626495361328, 17.39838409423828, 17.874141693115234]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 1.0, 16.0, 18.0, 26.0, 38.0, 61.0, 66.0, 163.0, 212.0, 369.0, 697.0, 1173.0, 2101.0, 3955.0, 8593.0, 19633.0, 49657.0, 133344.0, 348405.0, 298588.0, 108529.0, 41061.0, 16600.0, 7399.0, 3526.0, 1832.0, 992.0, 568.0, 341.0, 222.0, 126.0, 83.0, 55.0, 38.0, 19.0, 23.0, 8.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.357421875, -2.2857666015625, -2.214111328125, -2.1424560546875, -2.07080078125, -1.9991455078125, -1.927490234375, -1.8558349609375, -1.7841796875, -1.7125244140625, -1.640869140625, -1.5692138671875, -1.49755859375, -1.4259033203125, -1.354248046875, -1.2825927734375, -1.2109375, -1.1392822265625, -1.067626953125, -0.9959716796875, -0.92431640625, -0.8526611328125, -0.781005859375, -0.7093505859375, -0.6376953125, -0.5660400390625, -0.494384765625, -0.4227294921875, -0.35107421875, -0.2794189453125, -0.207763671875, -0.1361083984375, -0.064453125, 0.0072021484375, 0.078857421875, 0.1505126953125, 0.22216796875, 0.2938232421875, 0.365478515625, 0.4371337890625, 0.5087890625, 0.5804443359375, 0.652099609375, 0.7237548828125, 0.79541015625, 0.8670654296875, 0.938720703125, 1.0103759765625, 1.08203125, 1.1536865234375, 1.225341796875, 1.2969970703125, 1.36865234375, 1.4403076171875, 1.511962890625, 1.5836181640625, 1.6552734375, 1.7269287109375, 1.798583984375, 1.8702392578125, 1.94189453125, 2.0135498046875, 2.085205078125, 2.1568603515625, 2.228515625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 7.0, 4.0, 6.0, 9.0, 8.0, 15.0, 12.0, 12.0, 15.0, 18.0, 22.0, 19.0, 30.0, 35.0, 30.0, 33.0, 45.0, 37.0, 44.0, 37.0, 35.0, 47.0, 44.0, 39.0, 46.0, 38.0, 36.0, 29.0, 43.0, 25.0, 23.0, 22.0, 18.0, 10.0, 20.0, 9.0, 12.0, 19.0, 5.0, 11.0, 4.0, 6.0, 5.0, 5.0, 3.0, 7.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.775390625, -0.7483978271484375, -0.721405029296875, -0.6944122314453125, -0.66741943359375, -0.6404266357421875, -0.613433837890625, -0.5864410400390625, -0.5594482421875, -0.5324554443359375, -0.505462646484375, -0.4784698486328125, -0.45147705078125, -0.4244842529296875, -0.397491455078125, -0.3704986572265625, -0.343505859375, -0.3165130615234375, -0.289520263671875, -0.2625274658203125, -0.23553466796875, -0.2085418701171875, -0.181549072265625, -0.1545562744140625, -0.1275634765625, -0.1005706787109375, -0.073577880859375, -0.0465850830078125, -0.01959228515625, 0.0074005126953125, 0.034393310546875, 0.0613861083984375, 0.08837890625, 0.1153717041015625, 0.142364501953125, 0.1693572998046875, 0.19635009765625, 0.2233428955078125, 0.250335693359375, 0.2773284912109375, 0.3043212890625, 0.3313140869140625, 0.358306884765625, 0.3852996826171875, 0.41229248046875, 0.4392852783203125, 0.466278076171875, 0.4932708740234375, 0.520263671875, 0.5472564697265625, 0.574249267578125, 0.6012420654296875, 0.62823486328125, 0.6552276611328125, 0.682220458984375, 0.7092132568359375, 0.7362060546875, 0.7631988525390625, 0.790191650390625, 0.8171844482421875, 0.84417724609375, 0.8711700439453125, 0.898162841796875, 0.9251556396484375, 0.9521484375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 2.0, 9.0, 5.0, 12.0, 9.0, 19.0, 28.0, 38.0, 57.0, 77.0, 107.0, 163.0, 270.0, 415.0, 765.0, 1464.0, 3052.0, 8798.0, 40557.0, 352553.0, 574170.0, 49101.0, 9931.0, 3376.0, 1510.0, 757.0, 467.0, 259.0, 171.0, 141.0, 76.0, 45.0, 33.0, 35.0, 18.0, 13.0, 17.0, 14.0, 6.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-4.6328125, -4.500640869140625, -4.36846923828125, -4.236297607421875, -4.1041259765625, -3.971954345703125, -3.83978271484375, -3.707611083984375, -3.575439453125, -3.443267822265625, -3.31109619140625, -3.178924560546875, -3.0467529296875, -2.914581298828125, -2.78240966796875, -2.650238037109375, -2.51806640625, -2.385894775390625, -2.25372314453125, -2.121551513671875, -1.9893798828125, -1.857208251953125, -1.72503662109375, -1.592864990234375, -1.460693359375, -1.328521728515625, -1.19635009765625, -1.064178466796875, -0.9320068359375, -0.799835205078125, -0.66766357421875, -0.535491943359375, -0.4033203125, -0.271148681640625, -0.13897705078125, -0.006805419921875, 0.1253662109375, 0.257537841796875, 0.38970947265625, 0.521881103515625, 0.654052734375, 0.786224365234375, 0.91839599609375, 1.050567626953125, 1.1827392578125, 1.314910888671875, 1.44708251953125, 1.579254150390625, 1.71142578125, 1.843597412109375, 1.97576904296875, 2.107940673828125, 2.2401123046875, 2.372283935546875, 2.50445556640625, 2.636627197265625, 2.768798828125, 2.900970458984375, 3.03314208984375, 3.165313720703125, 3.2974853515625, 3.429656982421875, 3.56182861328125, 3.694000244140625, 3.826171875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 4.0, 1.0, 3.0, 1.0, 3.0, 4.0, 7.0, 9.0, 16.0, 17.0, 19.0, 40.0, 31.0, 49.0, 52.0, 65.0, 80.0, 63.0, 62.0, 55.0, 72.0, 67.0, 46.0, 56.0, 47.0, 34.0, 20.0, 25.0, 16.0, 12.0, 11.0, 9.0, 5.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.75390625, -3.58203125, -3.41015625, -3.23828125, -3.06640625, -2.89453125, -2.72265625, -2.55078125, -2.37890625, -2.20703125, -2.03515625, -1.86328125, -1.69140625, -1.51953125, -1.34765625, -1.17578125, -1.00390625, -0.83203125, -0.66015625, -0.48828125, -0.31640625, -0.14453125, 0.02734375, 0.19921875, 0.37109375, 0.54296875, 0.71484375, 0.88671875, 1.05859375, 1.23046875, 1.40234375, 1.57421875, 1.74609375, 1.91796875, 2.08984375, 2.26171875, 2.43359375, 2.60546875, 2.77734375, 2.94921875, 3.12109375, 3.29296875, 3.46484375, 3.63671875, 3.80859375, 3.98046875, 4.15234375, 4.32421875, 4.49609375, 4.66796875, 4.83984375, 5.01171875, 5.18359375, 5.35546875, 5.52734375, 5.69921875, 5.87109375, 6.04296875, 6.21484375, 6.38671875, 6.55859375, 6.73046875, 6.90234375, 7.07421875, 7.24609375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 4.0, 2.0, 0.0, 6.0, 7.0, 10.0, 11.0, 17.0, 17.0, 38.0, 58.0, 72.0, 117.0, 204.0, 430.0, 928.0, 2449.0, 9781.0, 73085.0, 785000.0, 154532.0, 15834.0, 3560.0, 1225.0, 464.0, 289.0, 133.0, 85.0, 67.0, 39.0, 23.0, 16.0, 16.0, 3.0, 7.0, 3.0, 5.0, 5.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-1.423828125, -1.3788299560546875, -1.333831787109375, -1.2888336181640625, -1.24383544921875, -1.1988372802734375, -1.153839111328125, -1.1088409423828125, -1.0638427734375, -1.0188446044921875, -0.973846435546875, -0.9288482666015625, -0.88385009765625, -0.8388519287109375, -0.793853759765625, -0.7488555908203125, -0.703857421875, -0.6588592529296875, -0.613861083984375, -0.5688629150390625, -0.52386474609375, -0.4788665771484375, -0.433868408203125, -0.3888702392578125, -0.3438720703125, -0.2988739013671875, -0.253875732421875, -0.2088775634765625, -0.16387939453125, -0.1188812255859375, -0.073883056640625, -0.0288848876953125, 0.01611328125, 0.0611114501953125, 0.106109619140625, 0.1511077880859375, 0.19610595703125, 0.2411041259765625, 0.286102294921875, 0.3311004638671875, 0.3760986328125, 0.4210968017578125, 0.466094970703125, 0.5110931396484375, 0.55609130859375, 0.6010894775390625, 0.646087646484375, 0.6910858154296875, 0.736083984375, 0.7810821533203125, 0.826080322265625, 0.8710784912109375, 0.91607666015625, 0.9610748291015625, 1.006072998046875, 1.0510711669921875, 1.0960693359375, 1.1410675048828125, 1.186065673828125, 1.2310638427734375, 1.27606201171875, 1.3210601806640625, 1.366058349609375, 1.4110565185546875, 1.4560546875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 2.0, 5.0, 4.0, 8.0, 13.0, 16.0, 10.0, 18.0, 18.0, 38.0, 29.0, 54.0, 49.0, 72.0, 94.0, 98.0, 110.0, 82.0, 65.0, 45.0, 44.0, 30.0, 22.0, 14.0, 9.0, 11.0, 3.0, 12.0, 6.0, 2.0, 3.0, 5.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002732276916503906, -0.0002643391489982605, -0.00025545060634613037, -0.00024656206369400024, -0.00023767352104187012, -0.00022878497838974, -0.00021989643573760986, -0.00021100789308547974, -0.0002021193504333496, -0.00019323080778121948, -0.00018434226512908936, -0.00017545372247695923, -0.0001665651798248291, -0.00015767663717269897, -0.00014878809452056885, -0.00013989955186843872, -0.0001310110092163086, -0.00012212246656417847, -0.00011323392391204834, -0.00010434538125991821, -9.545683860778809e-05, -8.656829595565796e-05, -7.767975330352783e-05, -6.87912106513977e-05, -5.990266799926758e-05, -5.101412534713745e-05, -4.2125582695007324e-05, -3.32370400428772e-05, -2.434849739074707e-05, -1.5459954738616943e-05, -6.571412086486816e-06, 2.3171305656433105e-06, 1.1205673217773438e-05, 2.0094215869903564e-05, 2.898275852203369e-05, 3.787130117416382e-05, 4.6759843826293945e-05, 5.564838647842407e-05, 6.45369291305542e-05, 7.342547178268433e-05, 8.231401443481445e-05, 9.120255708694458e-05, 0.00010009109973907471, 0.00010897964239120483, 0.00011786818504333496, 0.0001267567276954651, 0.00013564527034759521, 0.00014453381299972534, 0.00015342235565185547, 0.0001623108983039856, 0.00017119944095611572, 0.00018008798360824585, 0.00018897652626037598, 0.0001978650689125061, 0.00020675361156463623, 0.00021564215421676636, 0.00022453069686889648, 0.0002334192395210266, 0.00024230778217315674, 0.00025119632482528687, 0.000260084867477417, 0.0002689734101295471, 0.00027786195278167725, 0.0002867504954338074, 0.0002956390380859375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 1.0, 7.0, 5.0, 11.0, 8.0, 18.0, 17.0, 36.0, 38.0, 78.0, 154.0, 274.0, 566.0, 1312.0, 3571.0, 16881.0, 219435.0, 750982.0, 45001.0, 6542.0, 1949.0, 831.0, 357.0, 212.0, 116.0, 48.0, 34.0, 24.0, 21.0, 9.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.576171875, -1.5314178466796875, -1.486663818359375, -1.4419097900390625, -1.39715576171875, -1.3524017333984375, -1.307647705078125, -1.2628936767578125, -1.2181396484375, -1.1733856201171875, -1.128631591796875, -1.0838775634765625, -1.03912353515625, -0.9943695068359375, -0.949615478515625, -0.9048614501953125, -0.860107421875, -0.8153533935546875, -0.770599365234375, -0.7258453369140625, -0.68109130859375, -0.6363372802734375, -0.591583251953125, -0.5468292236328125, -0.5020751953125, -0.4573211669921875, -0.412567138671875, -0.3678131103515625, -0.32305908203125, -0.2783050537109375, -0.233551025390625, -0.1887969970703125, -0.14404296875, -0.0992889404296875, -0.054534912109375, -0.0097808837890625, 0.03497314453125, 0.0797271728515625, 0.124481201171875, 0.1692352294921875, 0.2139892578125, 0.2587432861328125, 0.303497314453125, 0.3482513427734375, 0.39300537109375, 0.4377593994140625, 0.482513427734375, 0.5272674560546875, 0.572021484375, 0.6167755126953125, 0.661529541015625, 0.7062835693359375, 0.75103759765625, 0.7957916259765625, 0.840545654296875, 0.8852996826171875, 0.9300537109375, 0.9748077392578125, 1.019561767578125, 1.0643157958984375, 1.10906982421875, 1.1538238525390625, 1.198577880859375, 1.2433319091796875, 1.2880859375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 8.0, 8.0, 15.0, 17.0, 25.0, 42.0, 51.0, 72.0, 93.0, 104.0, 121.0, 110.0, 104.0, 80.0, 52.0, 27.0, 27.0, 25.0, 15.0, 3.0, 7.0, 0.0, 3.0, 1.0, 2.0], "bins": [-2.451171875, -2.401702880859375, -2.35223388671875, -2.302764892578125, -2.2532958984375, -2.203826904296875, -2.15435791015625, -2.104888916015625, -2.055419921875, -2.005950927734375, -1.95648193359375, -1.907012939453125, -1.8575439453125, -1.808074951171875, -1.75860595703125, -1.709136962890625, -1.65966796875, -1.610198974609375, -1.56072998046875, -1.511260986328125, -1.4617919921875, -1.412322998046875, -1.36285400390625, -1.313385009765625, -1.263916015625, -1.214447021484375, -1.16497802734375, -1.115509033203125, -1.0660400390625, -1.016571044921875, -0.96710205078125, -0.917633056640625, -0.8681640625, -0.818695068359375, -0.76922607421875, -0.719757080078125, -0.6702880859375, -0.620819091796875, -0.57135009765625, -0.521881103515625, -0.472412109375, -0.422943115234375, -0.37347412109375, -0.324005126953125, -0.2745361328125, -0.225067138671875, -0.17559814453125, -0.126129150390625, -0.07666015625, -0.027191162109375, 0.02227783203125, 0.071746826171875, 0.1212158203125, 0.170684814453125, 0.22015380859375, 0.269622802734375, 0.319091796875, 0.368560791015625, 0.41802978515625, 0.467498779296875, 0.5169677734375, 0.566436767578125, 0.61590576171875, 0.665374755859375, 0.71484375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 10.0, 8.0, 8.0, 8.0, 13.0, 30.0, 52.0, 117.0, 189.0, 276.0, 125.0, 77.0, 41.0, 20.0, 11.0, 7.0, 2.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.426483154296875, -24.557722091674805, -23.688961029052734, -22.820199966430664, -21.951438903808594, -21.08267593383789, -20.21391487121582, -19.34515380859375, -18.47639274597168, -17.60763168334961, -16.73887062072754, -15.870108604431152, -15.001347541809082, -14.132586479187012, -13.263824462890625, -12.395063400268555, -11.526302337646484, -10.657541275024414, -9.788780212402344, -8.920018196105957, -8.051257133483887, -7.182496070861816, -6.313734531402588, -5.444972991943359, -4.576211929321289, -3.7074506282806396, -2.8386893272399902, -1.9699280261993408, -1.1011667251586914, -0.2324056625366211, 0.6363558769226074, 1.505117416381836, 2.373880386352539, 3.2426416873931885, 4.111402988433838, 4.980164527893066, 5.848925590515137, 6.717686653137207, 7.5864481925964355, 8.455209732055664, 9.323970794677734, 10.192731857299805, 11.061492919921875, 11.930254936218262, 12.799015998840332, 13.667777061462402, 14.536539077758789, 15.40530014038086, 16.27406120300293, 17.142822265625, 18.01158332824707, 18.88034439086914, 19.749107360839844, 20.61786651611328, 21.486629486083984, 22.355390548706055, 23.224151611328125, 24.092912673950195, 24.961673736572266, 25.830434799194336, 26.699195861816406, 27.56795883178711, 28.43671989440918, 29.30548095703125, 30.17424201965332]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 4.0, 4.0, 6.0, 9.0, 5.0, 10.0, 12.0, 8.0, 14.0, 18.0, 11.0, 21.0, 20.0, 25.0, 27.0, 25.0, 22.0, 32.0, 42.0, 45.0, 63.0, 66.0, 67.0, 58.0, 61.0, 43.0, 39.0, 33.0, 31.0, 22.0, 22.0, 18.0, 16.0, 12.0, 18.0, 6.0, 13.0, 16.0, 10.0, 6.0, 6.0, 4.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.952184677124023, -13.482481956481934, -13.01278018951416, -12.54307746887207, -12.073375701904297, -11.603672981262207, -11.133970260620117, -10.664268493652344, -10.19456672668457, -9.72486400604248, -9.255162239074707, -8.785459518432617, -8.315757751464844, -7.846055030822754, -7.376352787017822, -6.906650543212891, -6.436947822570801, -5.967245578765869, -5.4975433349609375, -5.027840614318848, -4.558138847351074, -4.088436126708984, -3.6187338829040527, -3.149031639099121, -2.6793293952941895, -2.209627151489258, -1.7399247884750366, -1.2702224254608154, -0.8005201816558838, -0.33081793785095215, 0.1388845443725586, 0.6085867881774902, 1.0782890319824219, 1.5479912757873535, 2.017693519592285, 2.487396001815796, 2.9570982456207275, 3.426800489425659, 3.89650297164917, 4.366205215454102, 4.835907459259033, 5.305609703063965, 5.7753119468688965, 6.245014190673828, 6.714716911315918, 7.184418678283691, 7.654121398925781, 8.123823165893555, 8.593525886535645, 9.063228607177734, 9.532930374145508, 10.002633094787598, 10.472334861755371, 10.942037582397461, 11.411739349365234, 11.881442070007324, 12.351144790649414, 12.820847511291504, 13.290549278259277, 13.760251998901367, 14.22995376586914, 14.69965648651123, 15.16935920715332, 15.639060974121094, 16.108762741088867]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 7.0, 5.0, 7.0, 11.0, 10.0, 17.0, 26.0, 42.0, 43.0, 100.0, 99.0, 143.0, 255.0, 355.0, 617.0, 1229.0, 2360.0, 4830.0, 11125.0, 32768.0, 185089.0, 2107797.0, 1657682.0, 142503.0, 27958.0, 9977.0, 4261.0, 2161.0, 1069.0, 632.0, 383.0, 225.0, 163.0, 85.0, 77.0, 50.0, 33.0, 27.0, 11.0, 6.0, 10.0, 8.0, 6.0, 4.0, 10.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.34765625, -1.304107666015625, -1.26055908203125, -1.217010498046875, -1.1734619140625, -1.129913330078125, -1.08636474609375, -1.042816162109375, -0.999267578125, -0.955718994140625, -0.91217041015625, -0.868621826171875, -0.8250732421875, -0.781524658203125, -0.73797607421875, -0.694427490234375, -0.65087890625, -0.607330322265625, -0.56378173828125, -0.520233154296875, -0.4766845703125, -0.433135986328125, -0.38958740234375, -0.346038818359375, -0.302490234375, -0.258941650390625, -0.21539306640625, -0.171844482421875, -0.1282958984375, -0.084747314453125, -0.04119873046875, 0.002349853515625, 0.0458984375, 0.089447021484375, 0.13299560546875, 0.176544189453125, 0.2200927734375, 0.263641357421875, 0.30718994140625, 0.350738525390625, 0.394287109375, 0.437835693359375, 0.48138427734375, 0.524932861328125, 0.5684814453125, 0.612030029296875, 0.65557861328125, 0.699127197265625, 0.74267578125, 0.786224365234375, 0.82977294921875, 0.873321533203125, 0.9168701171875, 0.960418701171875, 1.00396728515625, 1.047515869140625, 1.091064453125, 1.134613037109375, 1.17816162109375, 1.221710205078125, 1.2652587890625, 1.308807373046875, 1.35235595703125, 1.395904541015625, 1.439453125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 0.0, 1.0, 2.0, 10.0, 6.0, 5.0, 14.0, 12.0, 12.0, 18.0, 28.0, 23.0, 28.0, 30.0, 33.0, 41.0, 38.0, 47.0, 38.0, 31.0, 41.0, 38.0, 41.0, 43.0, 50.0, 40.0, 39.0, 37.0, 31.0, 26.0, 37.0, 19.0, 26.0, 15.0, 19.0, 10.0, 15.0, 15.0, 10.0, 9.0, 7.0, 2.0, 7.0, 3.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.8642578125, -0.8381881713867188, -0.8121185302734375, -0.7860488891601562, -0.759979248046875, -0.7339096069335938, -0.7078399658203125, -0.6817703247070312, -0.65570068359375, -0.6296310424804688, -0.6035614013671875, -0.5774917602539062, -0.551422119140625, -0.5253524780273438, -0.4992828369140625, -0.47321319580078125, -0.4471435546875, -0.42107391357421875, -0.3950042724609375, -0.36893463134765625, -0.342864990234375, -0.31679534912109375, -0.2907257080078125, -0.26465606689453125, -0.23858642578125, -0.21251678466796875, -0.1864471435546875, -0.16037750244140625, -0.134307861328125, -0.10823822021484375, -0.0821685791015625, -0.05609893798828125, -0.030029296875, -0.00395965576171875, 0.0221099853515625, 0.04817962646484375, 0.074249267578125, 0.10031890869140625, 0.1263885498046875, 0.15245819091796875, 0.17852783203125, 0.20459747314453125, 0.2306671142578125, 0.25673675537109375, 0.282806396484375, 0.30887603759765625, 0.3349456787109375, 0.36101531982421875, 0.3870849609375, 0.41315460205078125, 0.4392242431640625, 0.46529388427734375, 0.491363525390625, 0.5174331665039062, 0.5435028076171875, 0.5695724487304688, 0.59564208984375, 0.6217117309570312, 0.6477813720703125, 0.6738510131835938, 0.699920654296875, 0.7259902954101562, 0.7520599365234375, 0.7781295776367188, 0.80419921875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 5.0, 15.0, 13.0, 21.0, 32.0, 58.0, 116.0, 220.0, 499.0, 1294.0, 4324.0, 20560.0, 244331.0, 3795917.0, 107968.0, 13534.0, 3279.0, 1156.0, 463.0, 224.0, 101.0, 61.0, 39.0, 18.0, 15.0, 7.0, 6.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-3.958984375, -3.858428955078125, -3.75787353515625, -3.657318115234375, -3.5567626953125, -3.456207275390625, -3.35565185546875, -3.255096435546875, -3.154541015625, -3.053985595703125, -2.95343017578125, -2.852874755859375, -2.7523193359375, -2.651763916015625, -2.55120849609375, -2.450653076171875, -2.35009765625, -2.249542236328125, -2.14898681640625, -2.048431396484375, -1.9478759765625, -1.847320556640625, -1.74676513671875, -1.646209716796875, -1.545654296875, -1.445098876953125, -1.34454345703125, -1.243988037109375, -1.1434326171875, -1.042877197265625, -0.94232177734375, -0.841766357421875, -0.7412109375, -0.640655517578125, -0.54010009765625, -0.439544677734375, -0.3389892578125, -0.238433837890625, -0.13787841796875, -0.037322998046875, 0.063232421875, 0.163787841796875, 0.26434326171875, 0.364898681640625, 0.4654541015625, 0.566009521484375, 0.66656494140625, 0.767120361328125, 0.86767578125, 0.968231201171875, 1.06878662109375, 1.169342041015625, 1.2698974609375, 1.370452880859375, 1.47100830078125, 1.571563720703125, 1.672119140625, 1.772674560546875, 1.87322998046875, 1.973785400390625, 2.0743408203125, 2.174896240234375, 2.27545166015625, 2.376007080078125, 2.4765625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 7.0, 4.0, 5.0, 9.0, 16.0, 12.0, 22.0, 36.0, 55.0, 90.0, 132.0, 323.0, 692.0, 1145.0, 792.0, 309.0, 153.0, 94.0, 57.0, 30.0, 24.0, 20.0, 15.0, 9.0, 10.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.76171875, -2.676788330078125, -2.59185791015625, -2.506927490234375, -2.4219970703125, -2.337066650390625, -2.25213623046875, -2.167205810546875, -2.082275390625, -1.997344970703125, -1.91241455078125, -1.827484130859375, -1.7425537109375, -1.657623291015625, -1.57269287109375, -1.487762451171875, -1.40283203125, -1.317901611328125, -1.23297119140625, -1.148040771484375, -1.0631103515625, -0.978179931640625, -0.89324951171875, -0.808319091796875, -0.723388671875, -0.638458251953125, -0.55352783203125, -0.468597412109375, -0.3836669921875, -0.298736572265625, -0.21380615234375, -0.128875732421875, -0.0439453125, 0.040985107421875, 0.12591552734375, 0.210845947265625, 0.2957763671875, 0.380706787109375, 0.46563720703125, 0.550567626953125, 0.635498046875, 0.720428466796875, 0.80535888671875, 0.890289306640625, 0.9752197265625, 1.060150146484375, 1.14508056640625, 1.230010986328125, 1.31494140625, 1.399871826171875, 1.48480224609375, 1.569732666015625, 1.6546630859375, 1.739593505859375, 1.82452392578125, 1.909454345703125, 1.994384765625, 2.079315185546875, 2.16424560546875, 2.249176025390625, 2.3341064453125, 2.419036865234375, 2.50396728515625, 2.588897705078125, 2.673828125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 5.0, 20.0, 46.0, 215.0, 394.0, 224.0, 52.0, 12.0, 13.0, 6.0, 5.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.07345962524414, -15.891817092895508, -14.710174560546875, -13.528532028198242, -12.34688949584961, -11.165246963500977, -9.983604431152344, -8.801961898803711, -7.620319366455078, -6.438676834106445, -5.2570343017578125, -4.07539176940918, -2.893749237060547, -1.712106704711914, -0.5304641723632812, 0.6511783599853516, 1.8328208923339844, 3.014463424682617, 4.19610595703125, 5.377748489379883, 6.559391021728516, 7.741033554077148, 8.922676086425781, 10.104318618774414, 11.285961151123047, 12.46760368347168, 13.649246215820312, 14.830888748168945, 16.012531280517578, 17.19417381286621, 18.375816345214844, 19.557458877563477, 20.739105224609375, 21.920747756958008, 23.10239028930664, 24.284032821655273, 25.465675354003906, 26.64731788635254, 27.828960418701172, 29.010602951049805, 30.192245483398438, 31.37388801574707, 32.5555305480957, 33.73717498779297, 34.91881561279297, 36.10045623779297, 37.282100677490234, 38.4637451171875, 39.6453857421875, 40.8270263671875, 42.008670806884766, 43.19031524658203, 44.37195587158203, 45.55359649658203, 46.7352409362793, 47.91688537597656, 49.09852600097656, 50.28016662597656, 51.46181106567383, 52.643455505371094, 53.825096130371094, 55.006736755371094, 56.18838119506836, 57.370025634765625, 58.551666259765625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 3.0, 3.0, 3.0, 8.0, 9.0, 10.0, 20.0, 26.0, 23.0, 25.0, 36.0, 31.0, 55.0, 57.0, 65.0, 74.0, 45.0, 56.0, 61.0, 60.0, 66.0, 44.0, 39.0, 42.0, 31.0, 23.0, 32.0, 18.0, 15.0, 14.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.715545654296875, -11.338780403137207, -10.962014198303223, -10.585248947143555, -10.20848274230957, -9.831717491149902, -9.454952239990234, -9.07818603515625, -8.701420783996582, -8.324655532836914, -7.94788932800293, -7.571124076843262, -7.1943583488464355, -6.817592620849609, -6.440827369689941, -6.064061641693115, -5.687295913696289, -5.310530185699463, -4.933764457702637, -4.556999206542969, -4.180233478546143, -3.8034677505493164, -3.4267022609710693, -3.0499367713928223, -2.673171043395996, -2.29640531539917, -1.9196398258209229, -1.5428742170333862, -1.1661086082458496, -0.789342999458313, -0.41257739067077637, -0.0358119010925293, 0.3409538269042969, 0.7177194356918335, 1.0944850444793701, 1.4712506532669067, 1.8480162620544434, 2.2247819900512695, 2.6015474796295166, 2.9783129692077637, 3.35507869720459, 3.731844425201416, 4.108610153198242, 4.48537540435791, 4.862141132354736, 5.2389068603515625, 5.6156721115112305, 5.992437839508057, 6.369203567504883, 6.745969295501709, 7.122735023498535, 7.499500274658203, 7.876266002655029, 8.253031730651855, 8.629796981811523, 9.006563186645508, 9.383328437805176, 9.760093688964844, 10.136859893798828, 10.513625144958496, 10.890390396118164, 11.267156600952148, 11.643921852111816, 12.020687103271484, 12.397453308105469]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 9.0, 7.0, 24.0, 26.0, 48.0, 65.0, 99.0, 144.0, 238.0, 361.0, 585.0, 994.0, 1726.0, 3041.0, 6079.0, 12941.0, 30511.0, 74703.0, 184718.0, 343298.0, 226165.0, 93869.0, 37533.0, 15621.0, 7269.0, 3674.0, 1977.0, 1103.0, 619.0, 417.0, 256.0, 158.0, 97.0, 55.0, 51.0, 26.0, 11.0, 11.0, 9.0, 7.0, 7.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4287109375, -1.376983642578125, -1.32525634765625, -1.273529052734375, -1.2218017578125, -1.170074462890625, -1.11834716796875, -1.066619873046875, -1.014892578125, -0.963165283203125, -0.91143798828125, -0.859710693359375, -0.8079833984375, -0.756256103515625, -0.70452880859375, -0.652801513671875, -0.60107421875, -0.549346923828125, -0.49761962890625, -0.445892333984375, -0.3941650390625, -0.342437744140625, -0.29071044921875, -0.238983154296875, -0.187255859375, -0.135528564453125, -0.08380126953125, -0.032073974609375, 0.0196533203125, 0.071380615234375, 0.12310791015625, 0.174835205078125, 0.2265625, 0.278289794921875, 0.33001708984375, 0.381744384765625, 0.4334716796875, 0.485198974609375, 0.53692626953125, 0.588653564453125, 0.640380859375, 0.692108154296875, 0.74383544921875, 0.795562744140625, 0.8472900390625, 0.899017333984375, 0.95074462890625, 1.002471923828125, 1.05419921875, 1.105926513671875, 1.15765380859375, 1.209381103515625, 1.2611083984375, 1.312835693359375, 1.36456298828125, 1.416290283203125, 1.468017578125, 1.519744873046875, 1.57147216796875, 1.623199462890625, 1.6749267578125, 1.726654052734375, 1.77838134765625, 1.830108642578125, 1.8818359375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 13.0, 11.0, 6.0, 11.0, 20.0, 16.0, 21.0, 29.0, 38.0, 26.0, 33.0, 33.0, 42.0, 31.0, 42.0, 33.0, 38.0, 40.0, 40.0, 41.0, 44.0, 56.0, 37.0, 40.0, 23.0, 22.0, 19.0, 27.0, 27.0, 20.0, 15.0, 19.0, 18.0, 5.0, 16.0, 5.0, 9.0, 10.0, 4.0, 3.0, 5.0, 3.0, 1.0, 6.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.85009765625, -0.82452392578125, -0.7989501953125, -0.77337646484375, -0.747802734375, -0.72222900390625, -0.6966552734375, -0.67108154296875, -0.6455078125, -0.61993408203125, -0.5943603515625, -0.56878662109375, -0.543212890625, -0.51763916015625, -0.4920654296875, -0.46649169921875, -0.44091796875, -0.41534423828125, -0.3897705078125, -0.36419677734375, -0.338623046875, -0.31304931640625, -0.2874755859375, -0.26190185546875, -0.236328125, -0.21075439453125, -0.1851806640625, -0.15960693359375, -0.134033203125, -0.10845947265625, -0.0828857421875, -0.05731201171875, -0.03173828125, -0.00616455078125, 0.0194091796875, 0.04498291015625, 0.070556640625, 0.09613037109375, 0.1217041015625, 0.14727783203125, 0.1728515625, 0.19842529296875, 0.2239990234375, 0.24957275390625, 0.275146484375, 0.30072021484375, 0.3262939453125, 0.35186767578125, 0.37744140625, 0.40301513671875, 0.4285888671875, 0.45416259765625, 0.479736328125, 0.50531005859375, 0.5308837890625, 0.55645751953125, 0.58203125, 0.60760498046875, 0.6331787109375, 0.65875244140625, 0.684326171875, 0.70989990234375, 0.7354736328125, 0.76104736328125, 0.78662109375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 5.0, 8.0, 10.0, 11.0, 18.0, 29.0, 21.0, 28.0, 32.0, 79.0, 109.0, 199.0, 313.0, 610.0, 1442.0, 3994.0, 14153.0, 65017.0, 446367.0, 430308.0, 64650.0, 14088.0, 4072.0, 1492.0, 602.0, 310.0, 174.0, 120.0, 69.0, 53.0, 41.0, 40.0, 26.0, 19.0, 14.0, 10.0, 4.0, 5.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.396484375, -2.3138427734375, -2.231201171875, -2.1485595703125, -2.06591796875, -1.9832763671875, -1.900634765625, -1.8179931640625, -1.7353515625, -1.6527099609375, -1.570068359375, -1.4874267578125, -1.40478515625, -1.3221435546875, -1.239501953125, -1.1568603515625, -1.07421875, -0.9915771484375, -0.908935546875, -0.8262939453125, -0.74365234375, -0.6610107421875, -0.578369140625, -0.4957275390625, -0.4130859375, -0.3304443359375, -0.247802734375, -0.1651611328125, -0.08251953125, 0.0001220703125, 0.082763671875, 0.1654052734375, 0.248046875, 0.3306884765625, 0.413330078125, 0.4959716796875, 0.57861328125, 0.6612548828125, 0.743896484375, 0.8265380859375, 0.9091796875, 0.9918212890625, 1.074462890625, 1.1571044921875, 1.23974609375, 1.3223876953125, 1.405029296875, 1.4876708984375, 1.5703125, 1.6529541015625, 1.735595703125, 1.8182373046875, 1.90087890625, 1.9835205078125, 2.066162109375, 2.1488037109375, 2.2314453125, 2.3140869140625, 2.396728515625, 2.4793701171875, 2.56201171875, 2.6446533203125, 2.727294921875, 2.8099365234375, 2.892578125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 3.0, 4.0, 4.0, 9.0, 10.0, 12.0, 15.0, 16.0, 22.0, 22.0, 26.0, 42.0, 35.0, 37.0, 48.0, 47.0, 53.0, 57.0, 51.0, 62.0, 50.0, 43.0, 50.0, 50.0, 43.0, 29.0, 38.0, 19.0, 21.0, 20.0, 15.0, 15.0, 11.0, 5.0, 11.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.328125, -3.224029541015625, -3.11993408203125, -3.015838623046875, -2.9117431640625, -2.807647705078125, -2.70355224609375, -2.599456787109375, -2.495361328125, -2.391265869140625, -2.28717041015625, -2.183074951171875, -2.0789794921875, -1.974884033203125, -1.87078857421875, -1.766693115234375, -1.66259765625, -1.558502197265625, -1.45440673828125, -1.350311279296875, -1.2462158203125, -1.142120361328125, -1.03802490234375, -0.933929443359375, -0.829833984375, -0.725738525390625, -0.62164306640625, -0.517547607421875, -0.4134521484375, -0.309356689453125, -0.20526123046875, -0.101165771484375, 0.0029296875, 0.107025146484375, 0.21112060546875, 0.315216064453125, 0.4193115234375, 0.523406982421875, 0.62750244140625, 0.731597900390625, 0.835693359375, 0.939788818359375, 1.04388427734375, 1.147979736328125, 1.2520751953125, 1.356170654296875, 1.46026611328125, 1.564361572265625, 1.66845703125, 1.772552490234375, 1.87664794921875, 1.980743408203125, 2.0848388671875, 2.188934326171875, 2.29302978515625, 2.397125244140625, 2.501220703125, 2.605316162109375, 2.70941162109375, 2.813507080078125, 2.9176025390625, 3.021697998046875, 3.12579345703125, 3.229888916015625, 3.333984375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 6.0, 5.0, 22.0, 18.0, 24.0, 48.0, 82.0, 164.0, 294.0, 660.0, 1821.0, 5890.0, 27403.0, 182467.0, 702981.0, 103218.0, 16943.0, 4056.0, 1351.0, 505.0, 258.0, 147.0, 71.0, 43.0, 20.0, 18.0, 10.0, 11.0, 5.0, 8.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79638671875, -0.7683029174804688, -0.7402191162109375, -0.7121353149414062, -0.684051513671875, -0.6559677124023438, -0.6278839111328125, -0.5998001098632812, -0.57171630859375, -0.5436325073242188, -0.5155487060546875, -0.48746490478515625, -0.459381103515625, -0.43129730224609375, -0.4032135009765625, -0.37512969970703125, -0.3470458984375, -0.31896209716796875, -0.2908782958984375, -0.26279449462890625, -0.234710693359375, -0.20662689208984375, -0.1785430908203125, -0.15045928955078125, -0.12237548828125, -0.09429168701171875, -0.0662078857421875, -0.03812408447265625, -0.010040283203125, 0.01804351806640625, 0.0461273193359375, 0.07421112060546875, 0.102294921875, 0.13037872314453125, 0.1584625244140625, 0.18654632568359375, 0.214630126953125, 0.24271392822265625, 0.2707977294921875, 0.29888153076171875, 0.32696533203125, 0.35504913330078125, 0.3831329345703125, 0.41121673583984375, 0.439300537109375, 0.46738433837890625, 0.4954681396484375, 0.5235519409179688, 0.5516357421875, 0.5797195434570312, 0.6078033447265625, 0.6358871459960938, 0.663970947265625, 0.6920547485351562, 0.7201385498046875, 0.7482223510742188, 0.77630615234375, 0.8043899536132812, 0.8324737548828125, 0.8605575561523438, 0.888641357421875, 0.9167251586914062, 0.9448089599609375, 0.9728927612304688, 1.0009765625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 4.0, 5.0, 9.0, 8.0, 15.0, 19.0, 24.0, 38.0, 58.0, 80.0, 107.0, 132.0, 124.0, 119.0, 92.0, 49.0, 32.0, 21.0, 13.0, 15.0, 13.0, 7.0, 4.0, 2.0, 5.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00031828880310058594, -0.0003085993230342865, -0.00029890984296798706, -0.0002892203629016876, -0.0002795308828353882, -0.00026984140276908875, -0.0002601519227027893, -0.00025046244263648987, -0.00024077296257019043, -0.000231083482503891, -0.00022139400243759155, -0.00021170452237129211, -0.00020201504230499268, -0.00019232556223869324, -0.0001826360821723938, -0.00017294660210609436, -0.00016325712203979492, -0.00015356764197349548, -0.00014387816190719604, -0.0001341886818408966, -0.00012449920177459717, -0.00011480972170829773, -0.00010512024164199829, -9.543076157569885e-05, -8.574128150939941e-05, -7.605180144309998e-05, -6.636232137680054e-05, -5.66728413105011e-05, -4.698336124420166e-05, -3.729388117790222e-05, -2.7604401111602783e-05, -1.7914921045303345e-05, -8.225440979003906e-06, 1.4640390872955322e-06, 1.115351915359497e-05, 2.084299921989441e-05, 3.053247928619385e-05, 4.0221959352493286e-05, 4.9911439418792725e-05, 5.960091948509216e-05, 6.92903995513916e-05, 7.897987961769104e-05, 8.866935968399048e-05, 9.835883975028992e-05, 0.00010804831981658936, 0.0001177377998828888, 0.00012742727994918823, 0.00013711676001548767, 0.0001468062400817871, 0.00015649572014808655, 0.00016618520021438599, 0.00017587468028068542, 0.00018556416034698486, 0.0001952536404132843, 0.00020494312047958374, 0.00021463260054588318, 0.00022432208061218262, 0.00023401156067848206, 0.0002437010407447815, 0.00025339052081108093, 0.00026308000087738037, 0.0002727694809436798, 0.00028245896100997925, 0.0002921484410762787, 0.0003018379211425781]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 4.0, 16.0, 12.0, 19.0, 38.0, 55.0, 138.0, 316.0, 837.0, 2704.0, 12402.0, 95218.0, 759548.0, 153990.0, 17957.0, 3542.0, 1015.0, 394.0, 164.0, 72.0, 43.0, 28.0, 19.0, 4.0, 8.0, 4.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2880859375, -1.2538299560546875, -1.219573974609375, -1.1853179931640625, -1.15106201171875, -1.1168060302734375, -1.082550048828125, -1.0482940673828125, -1.0140380859375, -0.9797821044921875, -0.945526123046875, -0.9112701416015625, -0.87701416015625, -0.8427581787109375, -0.808502197265625, -0.7742462158203125, -0.739990234375, -0.7057342529296875, -0.671478271484375, -0.6372222900390625, -0.60296630859375, -0.5687103271484375, -0.534454345703125, -0.5001983642578125, -0.4659423828125, -0.4316864013671875, -0.397430419921875, -0.3631744384765625, -0.32891845703125, -0.2946624755859375, -0.260406494140625, -0.2261505126953125, -0.19189453125, -0.1576385498046875, -0.123382568359375, -0.0891265869140625, -0.05487060546875, -0.0206146240234375, 0.013641357421875, 0.0478973388671875, 0.0821533203125, 0.1164093017578125, 0.150665283203125, 0.1849212646484375, 0.21917724609375, 0.2534332275390625, 0.287689208984375, 0.3219451904296875, 0.356201171875, 0.3904571533203125, 0.424713134765625, 0.4589691162109375, 0.49322509765625, 0.5274810791015625, 0.561737060546875, 0.5959930419921875, 0.6302490234375, 0.6645050048828125, 0.698760986328125, 0.7330169677734375, 0.76727294921875, 0.8015289306640625, 0.835784912109375, 0.8700408935546875, 0.904296875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 4.0, 4.0, 5.0, 13.0, 15.0, 32.0, 20.0, 33.0, 49.0, 48.0, 62.0, 69.0, 82.0, 98.0, 89.0, 75.0, 63.0, 54.0, 46.0, 24.0, 33.0, 21.0, 21.0, 12.0, 8.0, 8.0, 3.0, 2.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8984375, -0.8707733154296875, -0.843109130859375, -0.8154449462890625, -0.78778076171875, -0.7601165771484375, -0.732452392578125, -0.7047882080078125, -0.6771240234375, -0.6494598388671875, -0.621795654296875, -0.5941314697265625, -0.56646728515625, -0.5388031005859375, -0.511138916015625, -0.4834747314453125, -0.455810546875, -0.4281463623046875, -0.400482177734375, -0.3728179931640625, -0.34515380859375, -0.3174896240234375, -0.289825439453125, -0.2621612548828125, -0.2344970703125, -0.2068328857421875, -0.179168701171875, -0.1515045166015625, -0.12384033203125, -0.0961761474609375, -0.068511962890625, -0.0408477783203125, -0.01318359375, 0.0144805908203125, 0.042144775390625, 0.0698089599609375, 0.09747314453125, 0.1251373291015625, 0.152801513671875, 0.1804656982421875, 0.2081298828125, 0.2357940673828125, 0.263458251953125, 0.2911224365234375, 0.31878662109375, 0.3464508056640625, 0.374114990234375, 0.4017791748046875, 0.429443359375, 0.4571075439453125, 0.484771728515625, 0.5124359130859375, 0.54010009765625, 0.5677642822265625, 0.595428466796875, 0.6230926513671875, 0.6507568359375, 0.6784210205078125, 0.706085205078125, 0.7337493896484375, 0.76141357421875, 0.7890777587890625, 0.816741943359375, 0.8444061279296875, 0.8720703125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 7.0, 16.0, 13.0, 36.0, 54.0, 79.0, 128.0, 217.0, 157.0, 93.0, 51.0, 54.0, 34.0, 18.0, 10.0, 5.0, 5.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.331497192382812, -12.849333763122559, -12.367170333862305, -11.885005950927734, -11.40284252166748, -10.920679092407227, -10.438515663146973, -9.956352233886719, -9.474187850952148, -8.992024421691895, -8.50986099243164, -8.02769660949707, -7.545533180236816, -7.0633697509765625, -6.581206321716309, -6.099042892456055, -5.616879463195801, -5.134716033935547, -4.652552127838135, -4.170388698577881, -3.688225030899048, -3.206061363220215, -2.723897933959961, -2.241734266281128, -1.759570598602295, -1.277406930923462, -0.7952433824539185, -0.313079833984375, 0.169083833694458, 0.651247501373291, 1.133410930633545, 1.615574598312378, 2.097738265991211, 2.579901933670044, 3.062065601348877, 3.544229030609131, 4.026392936706543, 4.508556365966797, 4.990719795227051, 5.472883224487305, 5.955047130584717, 6.437210559844971, 6.919374465942383, 7.401537895202637, 7.883701324462891, 8.365865707397461, 8.848028182983398, 9.330192565917969, 9.812355995178223, 10.294519424438477, 10.77668285369873, 11.258846282958984, 11.741010665893555, 12.223174095153809, 12.705337524414062, 13.187500953674316, 13.66966438293457, 14.151827812194824, 14.633991241455078, 15.116155624389648, 15.598319053649902, 16.080482482910156, 16.562644958496094, 17.044809341430664, 17.526973724365234]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 7.0, 2.0, 4.0, 4.0, 8.0, 7.0, 9.0, 8.0, 7.0, 12.0, 7.0, 14.0, 18.0, 26.0, 18.0, 27.0, 25.0, 27.0, 31.0, 39.0, 50.0, 46.0, 63.0, 76.0, 65.0, 54.0, 49.0, 29.0, 24.0, 22.0, 26.0, 25.0, 23.0, 22.0, 16.0, 24.0, 16.0, 13.0, 18.0, 5.0, 8.0, 6.0, 5.0, 7.0, 4.0, 5.0, 5.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.22567367553711, -9.891401290893555, -9.55712890625, -9.222856521606445, -8.88858413696289, -8.554311752319336, -8.220039367675781, -7.885766983032227, -7.551494598388672, -7.217222213745117, -6.8829498291015625, -6.548677444458008, -6.214405059814453, -5.880132675170898, -5.545860290527344, -5.211587905883789, -4.877315044403076, -4.5430426597595215, -4.208770275115967, -3.874497890472412, -3.5402255058288574, -3.2059531211853027, -2.871680498123169, -2.5374081134796143, -2.2031357288360596, -1.8688633441925049, -1.5345909595489502, -1.200318455696106, -0.8660460710525513, -0.5317736864089966, -0.19750118255615234, 0.13677120208740234, 0.47104358673095703, 0.8053159713745117, 1.1395883560180664, 1.4738608598709106, 1.8081332445144653, 2.1424055099487305, 2.4766781330108643, 2.810950517654419, 3.1452229022979736, 3.4794952869415283, 3.813767671585083, 4.148040294647217, 4.4823126792907715, 4.816585063934326, 5.150857448577881, 5.4851298332214355, 5.81940221786499, 6.153674602508545, 6.4879469871521, 6.822219371795654, 7.156491756439209, 7.490764141082764, 7.825037002563477, 8.159309387207031, 8.493581771850586, 8.82785415649414, 9.162126541137695, 9.49639892578125, 9.830671310424805, 10.16494369506836, 10.499216079711914, 10.833488464355469, 11.167760848999023]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 8.0, 6.0, 12.0, 21.0, 33.0, 40.0, 54.0, 72.0, 95.0, 135.0, 229.0, 314.0, 544.0, 942.0, 1663.0, 3237.0, 6765.0, 16306.0, 56966.0, 357909.0, 2612663.0, 973137.0, 117845.0, 25971.0, 9667.0, 4363.0, 2145.0, 1252.0, 722.0, 366.0, 259.0, 179.0, 87.0, 61.0, 54.0, 43.0, 33.0, 27.0, 16.0, 10.0, 12.0, 6.0, 5.0, 6.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.009765625, -0.9733428955078125, -0.936920166015625, -0.9004974365234375, -0.86407470703125, -0.8276519775390625, -0.791229248046875, -0.7548065185546875, -0.7183837890625, -0.6819610595703125, -0.645538330078125, -0.6091156005859375, -0.57269287109375, -0.5362701416015625, -0.499847412109375, -0.4634246826171875, -0.427001953125, -0.3905792236328125, -0.354156494140625, -0.3177337646484375, -0.28131103515625, -0.2448883056640625, -0.208465576171875, -0.1720428466796875, -0.1356201171875, -0.0991973876953125, -0.062774658203125, -0.0263519287109375, 0.01007080078125, 0.0464935302734375, 0.082916259765625, 0.1193389892578125, 0.15576171875, 0.1921844482421875, 0.228607177734375, 0.2650299072265625, 0.30145263671875, 0.3378753662109375, 0.374298095703125, 0.4107208251953125, 0.4471435546875, 0.4835662841796875, 0.519989013671875, 0.5564117431640625, 0.59283447265625, 0.6292572021484375, 0.665679931640625, 0.7021026611328125, 0.738525390625, 0.7749481201171875, 0.811370849609375, 0.8477935791015625, 0.88421630859375, 0.9206390380859375, 0.957061767578125, 0.9934844970703125, 1.0299072265625, 1.0663299560546875, 1.102752685546875, 1.1391754150390625, 1.17559814453125, 1.2120208740234375, 1.248443603515625, 1.2848663330078125, 1.3212890625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 6.0, 7.0, 9.0, 6.0, 5.0, 10.0, 10.0, 11.0, 12.0, 19.0, 20.0, 31.0, 26.0, 31.0, 36.0, 43.0, 34.0, 41.0, 32.0, 31.0, 33.0, 47.0, 35.0, 53.0, 49.0, 39.0, 49.0, 32.0, 32.0, 25.0, 30.0, 20.0, 22.0, 20.0, 17.0, 18.0, 14.0, 10.0, 8.0, 5.0, 3.0, 5.0, 8.0, 5.0, 3.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7724609375, -0.7482147216796875, -0.723968505859375, -0.6997222900390625, -0.67547607421875, -0.6512298583984375, -0.626983642578125, -0.6027374267578125, -0.5784912109375, -0.5542449951171875, -0.529998779296875, -0.5057525634765625, -0.48150634765625, -0.4572601318359375, -0.433013916015625, -0.4087677001953125, -0.384521484375, -0.3602752685546875, -0.336029052734375, -0.3117828369140625, -0.28753662109375, -0.2632904052734375, -0.239044189453125, -0.2147979736328125, -0.1905517578125, -0.1663055419921875, -0.142059326171875, -0.1178131103515625, -0.09356689453125, -0.0693206787109375, -0.045074462890625, -0.0208282470703125, 0.00341796875, 0.0276641845703125, 0.051910400390625, 0.0761566162109375, 0.10040283203125, 0.1246490478515625, 0.148895263671875, 0.1731414794921875, 0.1973876953125, 0.2216339111328125, 0.245880126953125, 0.2701263427734375, 0.29437255859375, 0.3186187744140625, 0.342864990234375, 0.3671112060546875, 0.391357421875, 0.4156036376953125, 0.439849853515625, 0.4640960693359375, 0.48834228515625, 0.5125885009765625, 0.536834716796875, 0.5610809326171875, 0.5853271484375, 0.6095733642578125, 0.633819580078125, 0.6580657958984375, 0.68231201171875, 0.7065582275390625, 0.730804443359375, 0.7550506591796875, 0.779296875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 8.0, 5.0, 2.0, 18.0, 23.0, 28.0, 44.0, 57.0, 125.0, 299.0, 693.0, 2051.0, 7706.0, 46313.0, 2200385.0, 1882987.0, 42966.0, 7302.0, 1976.0, 645.0, 290.0, 141.0, 74.0, 42.0, 28.0, 29.0, 15.0, 8.0, 7.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.984375, -2.899078369140625, -2.81378173828125, -2.728485107421875, -2.6431884765625, -2.557891845703125, -2.47259521484375, -2.387298583984375, -2.302001953125, -2.216705322265625, -2.13140869140625, -2.046112060546875, -1.9608154296875, -1.875518798828125, -1.79022216796875, -1.704925537109375, -1.61962890625, -1.534332275390625, -1.44903564453125, -1.363739013671875, -1.2784423828125, -1.193145751953125, -1.10784912109375, -1.022552490234375, -0.937255859375, -0.851959228515625, -0.76666259765625, -0.681365966796875, -0.5960693359375, -0.510772705078125, -0.42547607421875, -0.340179443359375, -0.2548828125, -0.169586181640625, -0.08428955078125, 0.001007080078125, 0.0863037109375, 0.171600341796875, 0.25689697265625, 0.342193603515625, 0.427490234375, 0.512786865234375, 0.59808349609375, 0.683380126953125, 0.7686767578125, 0.853973388671875, 0.93927001953125, 1.024566650390625, 1.10986328125, 1.195159912109375, 1.28045654296875, 1.365753173828125, 1.4510498046875, 1.536346435546875, 1.62164306640625, 1.706939697265625, 1.792236328125, 1.877532958984375, 1.96282958984375, 2.048126220703125, 2.1334228515625, 2.218719482421875, 2.30401611328125, 2.389312744140625, 2.474609375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 1.0, 1.0, 5.0, 7.0, 3.0, 10.0, 26.0, 17.0, 23.0, 47.0, 68.0, 103.0, 212.0, 469.0, 979.0, 1059.0, 517.0, 218.0, 119.0, 63.0, 45.0, 23.0, 22.0, 8.0, 11.0, 4.0, 6.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9892578125, -1.9129791259765625, -1.836700439453125, -1.7604217529296875, -1.68414306640625, -1.6078643798828125, -1.531585693359375, -1.4553070068359375, -1.3790283203125, -1.3027496337890625, -1.226470947265625, -1.1501922607421875, -1.07391357421875, -0.9976348876953125, -0.921356201171875, -0.8450775146484375, -0.768798828125, -0.6925201416015625, -0.616241455078125, -0.5399627685546875, -0.46368408203125, -0.3874053955078125, -0.311126708984375, -0.2348480224609375, -0.1585693359375, -0.0822906494140625, -0.006011962890625, 0.0702667236328125, 0.14654541015625, 0.2228240966796875, 0.299102783203125, 0.3753814697265625, 0.45166015625, 0.5279388427734375, 0.604217529296875, 0.6804962158203125, 0.75677490234375, 0.8330535888671875, 0.909332275390625, 0.9856109619140625, 1.0618896484375, 1.1381683349609375, 1.214447021484375, 1.2907257080078125, 1.36700439453125, 1.4432830810546875, 1.519561767578125, 1.5958404541015625, 1.672119140625, 1.7483978271484375, 1.824676513671875, 1.9009552001953125, 1.97723388671875, 2.0535125732421875, 2.129791259765625, 2.2060699462890625, 2.2823486328125, 2.3586273193359375, 2.434906005859375, 2.5111846923828125, 2.58746337890625, 2.6637420654296875, 2.740020751953125, 2.8162994384765625, 2.892578125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 2.0, 1.0, 5.0, 15.0, 22.0, 47.0, 85.0, 167.0, 257.0, 192.0, 93.0, 62.0, 24.0, 13.0, 6.0, 2.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.713455200195312, -20.100908279418945, -19.48836326599121, -18.875816345214844, -18.26327133178711, -17.650724411010742, -17.038177490234375, -16.42563247680664, -15.813085556030273, -15.200539588928223, -14.587993621826172, -13.975446701049805, -13.362900733947754, -12.750354766845703, -12.137808799743652, -11.525262832641602, -10.91271686553955, -10.3001708984375, -9.68762493133545, -9.075078964233398, -8.462532043457031, -7.8499860763549805, -7.23744010925293, -6.624893665313721, -6.01234769821167, -5.399801731109619, -4.78725528717041, -4.174709320068359, -3.5621631145477295, -2.9496169090270996, -2.337070941925049, -1.7245244979858398, -1.111978530883789, -0.49943238496780396, 0.11311376094818115, 0.7256598472595215, 1.3382060527801514, 1.9507522583007812, 2.563298225402832, 3.175844669342041, 3.788390636444092, 4.400936603546143, 5.013483047485352, 5.626029014587402, 6.238574981689453, 6.851121425628662, 7.463667392730713, 8.076213836669922, 8.688759803771973, 9.301305770874023, 9.913851737976074, 10.526397705078125, 11.138944625854492, 11.751490592956543, 12.364036560058594, 12.976583480834961, 13.589128494262695, 14.201674461364746, 14.814220428466797, 15.426767349243164, 16.0393123626709, 16.651859283447266, 17.264404296875, 17.876951217651367, 18.489498138427734]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 3.0, 4.0, 13.0, 17.0, 14.0, 13.0, 18.0, 19.0, 24.0, 32.0, 26.0, 45.0, 44.0, 42.0, 49.0, 52.0, 45.0, 57.0, 42.0, 66.0, 35.0, 44.0, 46.0, 31.0, 43.0, 29.0, 31.0, 24.0, 14.0, 16.0, 11.0, 14.0, 9.0, 9.0, 5.0, 5.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.31397819519043, -9.049446105957031, -8.784913063049316, -8.520380973815918, -8.255847930908203, -7.991315841674805, -7.726783275604248, -7.462250709533691, -7.197718143463135, -6.933185577392578, -6.6686530113220215, -6.404120445251465, -6.139588356018066, -5.875055313110352, -5.610523223876953, -5.3459906578063965, -5.08145809173584, -4.816925525665283, -4.552392959594727, -4.28786039352417, -4.023327827453613, -3.7587954998016357, -3.494263172149658, -3.2297306060791016, -2.965198040008545, -2.7006654739379883, -2.4361329078674316, -2.171600580215454, -1.9070680141448975, -1.6425354480743408, -1.3780030012130737, -1.1134705543518066, -0.8489370346069336, -0.5844045281410217, -0.31987202167510986, -0.055339515209198, 0.20919299125671387, 0.4737255573272705, 0.7382580041885376, 1.0027904510498047, 1.2673230171203613, 1.531855583190918, 1.796388030052185, 2.060920476913452, 2.325453042984009, 2.5899856090545654, 2.854517936706543, 3.1190505027770996, 3.3835830688476562, 3.648115634918213, 3.9126482009887695, 4.177180767059326, 4.441713333129883, 4.706245422363281, 4.970777988433838, 5.2353105545043945, 5.499843120574951, 5.764375686645508, 6.0289082527160645, 6.293440818786621, 6.5579729080200195, 6.822505950927734, 7.087038040161133, 7.3515706062316895, 7.616103172302246]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 3.0, 6.0, 10.0, 9.0, 18.0, 23.0, 37.0, 54.0, 76.0, 114.0, 175.0, 206.0, 333.0, 520.0, 805.0, 1312.0, 2234.0, 3750.0, 6773.0, 12748.0, 25508.0, 54246.0, 122987.0, 276508.0, 291662.0, 132540.0, 57889.0, 27259.0, 13629.0, 7072.0, 3866.0, 2334.0, 1352.0, 850.0, 534.0, 375.0, 231.0, 168.0, 107.0, 77.0, 41.0, 36.0, 23.0, 22.0, 10.0, 5.0, 7.0, 2.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.171875, -1.134124755859375, -1.09637451171875, -1.058624267578125, -1.0208740234375, -0.983123779296875, -0.94537353515625, -0.907623291015625, -0.869873046875, -0.832122802734375, -0.79437255859375, -0.756622314453125, -0.7188720703125, -0.681121826171875, -0.64337158203125, -0.605621337890625, -0.56787109375, -0.530120849609375, -0.49237060546875, -0.454620361328125, -0.4168701171875, -0.379119873046875, -0.34136962890625, -0.303619384765625, -0.265869140625, -0.228118896484375, -0.19036865234375, -0.152618408203125, -0.1148681640625, -0.077117919921875, -0.03936767578125, -0.001617431640625, 0.0361328125, 0.073883056640625, 0.11163330078125, 0.149383544921875, 0.1871337890625, 0.224884033203125, 0.26263427734375, 0.300384521484375, 0.338134765625, 0.375885009765625, 0.41363525390625, 0.451385498046875, 0.4891357421875, 0.526885986328125, 0.56463623046875, 0.602386474609375, 0.64013671875, 0.677886962890625, 0.71563720703125, 0.753387451171875, 0.7911376953125, 0.828887939453125, 0.86663818359375, 0.904388427734375, 0.942138671875, 0.979888916015625, 1.01763916015625, 1.055389404296875, 1.0931396484375, 1.130889892578125, 1.16864013671875, 1.206390380859375, 1.244140625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 6.0, 2.0, 3.0, 7.0, 15.0, 10.0, 15.0, 13.0, 11.0, 15.0, 15.0, 32.0, 32.0, 21.0, 29.0, 36.0, 29.0, 40.0, 35.0, 35.0, 38.0, 51.0, 42.0, 37.0, 34.0, 48.0, 37.0, 43.0, 35.0, 30.0, 27.0, 15.0, 26.0, 22.0, 24.0, 23.0, 15.0, 11.0, 11.0, 6.0, 7.0, 5.0, 1.0, 7.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.71044921875, -0.68707275390625, -0.6636962890625, -0.64031982421875, -0.616943359375, -0.59356689453125, -0.5701904296875, -0.54681396484375, -0.5234375, -0.50006103515625, -0.4766845703125, -0.45330810546875, -0.429931640625, -0.40655517578125, -0.3831787109375, -0.35980224609375, -0.33642578125, -0.31304931640625, -0.2896728515625, -0.26629638671875, -0.242919921875, -0.21954345703125, -0.1961669921875, -0.17279052734375, -0.1494140625, -0.12603759765625, -0.1026611328125, -0.07928466796875, -0.055908203125, -0.03253173828125, -0.0091552734375, 0.01422119140625, 0.03759765625, 0.06097412109375, 0.0843505859375, 0.10772705078125, 0.131103515625, 0.15447998046875, 0.1778564453125, 0.20123291015625, 0.224609375, 0.24798583984375, 0.2713623046875, 0.29473876953125, 0.318115234375, 0.34149169921875, 0.3648681640625, 0.38824462890625, 0.41162109375, 0.43499755859375, 0.4583740234375, 0.48175048828125, 0.505126953125, 0.52850341796875, 0.5518798828125, 0.57525634765625, 0.5986328125, 0.62200927734375, 0.6453857421875, 0.66876220703125, 0.692138671875, 0.71551513671875, 0.7388916015625, 0.76226806640625, 0.78564453125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 8.0, 7.0, 9.0, 10.0, 17.0, 33.0, 38.0, 40.0, 75.0, 127.0, 146.0, 224.0, 432.0, 711.0, 1320.0, 2794.0, 7078.0, 24227.0, 114454.0, 689434.0, 160329.0, 31500.0, 8855.0, 3260.0, 1444.0, 759.0, 432.0, 266.0, 160.0, 117.0, 76.0, 40.0, 35.0, 25.0, 19.0, 19.0, 7.0, 6.0, 5.0, 6.0, 7.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-2.326171875, -2.2589263916015625, -2.191680908203125, -2.1244354248046875, -2.05718994140625, -1.9899444580078125, -1.922698974609375, -1.8554534912109375, -1.7882080078125, -1.7209625244140625, -1.653717041015625, -1.5864715576171875, -1.51922607421875, -1.4519805908203125, -1.384735107421875, -1.3174896240234375, -1.250244140625, -1.1829986572265625, -1.115753173828125, -1.0485076904296875, -0.98126220703125, -0.9140167236328125, -0.846771240234375, -0.7795257568359375, -0.7122802734375, -0.6450347900390625, -0.577789306640625, -0.5105438232421875, -0.44329833984375, -0.3760528564453125, -0.308807373046875, -0.2415618896484375, -0.17431640625, -0.1070709228515625, -0.039825439453125, 0.0274200439453125, 0.09466552734375, 0.1619110107421875, 0.229156494140625, 0.2964019775390625, 0.3636474609375, 0.4308929443359375, 0.498138427734375, 0.5653839111328125, 0.63262939453125, 0.6998748779296875, 0.767120361328125, 0.8343658447265625, 0.901611328125, 0.9688568115234375, 1.036102294921875, 1.1033477783203125, 1.17059326171875, 1.2378387451171875, 1.305084228515625, 1.3723297119140625, 1.4395751953125, 1.5068206787109375, 1.574066162109375, 1.6413116455078125, 1.70855712890625, 1.7758026123046875, 1.843048095703125, 1.9102935791015625, 1.9775390625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 7.0, 3.0, 6.0, 9.0, 12.0, 9.0, 24.0, 30.0, 29.0, 41.0, 50.0, 53.0, 53.0, 59.0, 62.0, 66.0, 62.0, 53.0, 52.0, 48.0, 56.0, 46.0, 30.0, 30.0, 32.0, 19.0, 13.0, 15.0, 7.0, 1.0, 6.0, 6.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.2265625, -4.115997314453125, -4.00543212890625, -3.894866943359375, -3.7843017578125, -3.673736572265625, -3.56317138671875, -3.452606201171875, -3.342041015625, -3.231475830078125, -3.12091064453125, -3.010345458984375, -2.8997802734375, -2.789215087890625, -2.67864990234375, -2.568084716796875, -2.45751953125, -2.346954345703125, -2.23638916015625, -2.125823974609375, -2.0152587890625, -1.904693603515625, -1.79412841796875, -1.683563232421875, -1.572998046875, -1.462432861328125, -1.35186767578125, -1.241302490234375, -1.1307373046875, -1.020172119140625, -0.90960693359375, -0.799041748046875, -0.6884765625, -0.577911376953125, -0.46734619140625, -0.356781005859375, -0.2462158203125, -0.135650634765625, -0.02508544921875, 0.085479736328125, 0.196044921875, 0.306610107421875, 0.41717529296875, 0.527740478515625, 0.6383056640625, 0.748870849609375, 0.85943603515625, 0.970001220703125, 1.08056640625, 1.191131591796875, 1.30169677734375, 1.412261962890625, 1.5228271484375, 1.633392333984375, 1.74395751953125, 1.854522705078125, 1.965087890625, 2.075653076171875, 2.18621826171875, 2.296783447265625, 2.4073486328125, 2.517913818359375, 2.62847900390625, 2.739044189453125, 2.849609375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 5.0, 6.0, 9.0, 11.0, 10.0, 16.0, 26.0, 46.0, 65.0, 108.0, 181.0, 341.0, 703.0, 1593.0, 4422.0, 15898.0, 81536.0, 753646.0, 153973.0, 25429.0, 6518.0, 2120.0, 904.0, 420.0, 204.0, 120.0, 70.0, 63.0, 48.0, 23.0, 13.0, 9.0, 9.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7001953125, -0.6773529052734375, -0.654510498046875, -0.6316680908203125, -0.60882568359375, -0.5859832763671875, -0.563140869140625, -0.5402984619140625, -0.5174560546875, -0.4946136474609375, -0.471771240234375, -0.4489288330078125, -0.42608642578125, -0.4032440185546875, -0.380401611328125, -0.3575592041015625, -0.334716796875, -0.3118743896484375, -0.289031982421875, -0.2661895751953125, -0.24334716796875, -0.2205047607421875, -0.197662353515625, -0.1748199462890625, -0.1519775390625, -0.1291351318359375, -0.106292724609375, -0.0834503173828125, -0.06060791015625, -0.0377655029296875, -0.014923095703125, 0.0079193115234375, 0.03076171875, 0.0536041259765625, 0.076446533203125, 0.0992889404296875, 0.12213134765625, 0.1449737548828125, 0.167816162109375, 0.1906585693359375, 0.2135009765625, 0.2363433837890625, 0.259185791015625, 0.2820281982421875, 0.30487060546875, 0.3277130126953125, 0.350555419921875, 0.3733978271484375, 0.396240234375, 0.4190826416015625, 0.441925048828125, 0.4647674560546875, 0.48760986328125, 0.5104522705078125, 0.533294677734375, 0.5561370849609375, 0.5789794921875, 0.6018218994140625, 0.624664306640625, 0.6475067138671875, 0.67034912109375, 0.6931915283203125, 0.716033935546875, 0.7388763427734375, 0.76171875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 8.0, 7.0, 9.0, 2.0, 8.0, 16.0, 12.0, 17.0, 22.0, 31.0, 35.0, 61.0, 40.0, 66.0, 95.0, 123.0, 111.0, 65.0, 58.0, 44.0, 39.0, 24.0, 21.0, 20.0, 12.0, 12.0, 8.0, 3.0, 9.0, 4.0, 7.0, 8.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014162063598632812, -0.000136692076921463, -0.0001317635178565979, -0.0001268349587917328, -0.00012190639972686768, -0.00011697784066200256, -0.00011204928159713745, -0.00010712072253227234, -0.00010219216346740723, -9.726360440254211e-05, -9.2335045337677e-05, -8.740648627281189e-05, -8.247792720794678e-05, -7.754936814308167e-05, -7.262080907821655e-05, -6.769225001335144e-05, -6.276369094848633e-05, -5.7835131883621216e-05, -5.2906572818756104e-05, -4.797801375389099e-05, -4.304945468902588e-05, -3.8120895624160767e-05, -3.3192336559295654e-05, -2.8263777494430542e-05, -2.333521842956543e-05, -1.8406659364700317e-05, -1.3478100299835205e-05, -8.549541234970093e-06, -3.6209821701049805e-06, 1.3075768947601318e-06, 6.236135959625244e-06, 1.1164695024490356e-05, 1.609325408935547e-05, 2.102181315422058e-05, 2.5950372219085693e-05, 3.0878931283950806e-05, 3.580749034881592e-05, 4.073604941368103e-05, 4.566460847854614e-05, 5.0593167543411255e-05, 5.552172660827637e-05, 6.045028567314148e-05, 6.537884473800659e-05, 7.03074038028717e-05, 7.523596286773682e-05, 8.016452193260193e-05, 8.509308099746704e-05, 9.002164006233215e-05, 9.495019912719727e-05, 9.987875819206238e-05, 0.00010480731725692749, 0.0001097358763217926, 0.00011466443538665771, 0.00011959299445152283, 0.00012452155351638794, 0.00012945011258125305, 0.00013437867164611816, 0.00013930723071098328, 0.0001442357897758484, 0.0001491643488407135, 0.0001540929079055786, 0.00015902146697044373, 0.00016395002603530884, 0.00016887858510017395, 0.00017380714416503906]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 0.0, 1.0, 1.0, 8.0, 4.0, 1.0, 7.0, 5.0, 10.0, 18.0, 20.0, 43.0, 56.0, 123.0, 257.0, 411.0, 868.0, 2144.0, 6215.0, 26524.0, 232395.0, 715770.0, 49013.0, 9515.0, 2799.0, 1137.0, 541.0, 279.0, 153.0, 84.0, 48.0, 30.0, 25.0, 20.0, 6.0, 3.0, 5.0, 3.0, 6.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.791015625, -0.7664260864257812, -0.7418365478515625, -0.7172470092773438, -0.692657470703125, -0.6680679321289062, -0.6434783935546875, -0.6188888549804688, -0.59429931640625, -0.5697097778320312, -0.5451202392578125, -0.5205307006835938, -0.495941162109375, -0.47135162353515625, -0.4467620849609375, -0.42217254638671875, -0.3975830078125, -0.37299346923828125, -0.3484039306640625, -0.32381439208984375, -0.299224853515625, -0.27463531494140625, -0.2500457763671875, -0.22545623779296875, -0.20086669921875, -0.17627716064453125, -0.1516876220703125, -0.12709808349609375, -0.102508544921875, -0.07791900634765625, -0.0533294677734375, -0.02873992919921875, -0.004150390625, 0.02043914794921875, 0.0450286865234375, 0.06961822509765625, 0.094207763671875, 0.11879730224609375, 0.1433868408203125, 0.16797637939453125, 0.19256591796875, 0.21715545654296875, 0.2417449951171875, 0.26633453369140625, 0.290924072265625, 0.31551361083984375, 0.3401031494140625, 0.36469268798828125, 0.3892822265625, 0.41387176513671875, 0.4384613037109375, 0.46305084228515625, 0.487640380859375, 0.5122299194335938, 0.5368194580078125, 0.5614089965820312, 0.58599853515625, 0.6105880737304688, 0.6351776123046875, 0.6597671508789062, 0.684356689453125, 0.7089462280273438, 0.7335357666015625, 0.7581253051757812, 0.78271484375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 5.0, 8.0, 15.0, 13.0, 37.0, 57.0, 85.0, 140.0, 180.0, 148.0, 105.0, 71.0, 41.0, 35.0, 22.0, 19.0, 6.0, 3.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1689453125, -1.1321258544921875, -1.095306396484375, -1.0584869384765625, -1.02166748046875, -0.9848480224609375, -0.948028564453125, -0.9112091064453125, -0.8743896484375, -0.8375701904296875, -0.800750732421875, -0.7639312744140625, -0.72711181640625, -0.6902923583984375, -0.653472900390625, -0.6166534423828125, -0.579833984375, -0.5430145263671875, -0.506195068359375, -0.4693756103515625, -0.43255615234375, -0.3957366943359375, -0.358917236328125, -0.3220977783203125, -0.2852783203125, -0.2484588623046875, -0.211639404296875, -0.1748199462890625, -0.13800048828125, -0.1011810302734375, -0.064361572265625, -0.0275421142578125, 0.00927734375, 0.0460968017578125, 0.082916259765625, 0.1197357177734375, 0.15655517578125, 0.1933746337890625, 0.230194091796875, 0.2670135498046875, 0.3038330078125, 0.3406524658203125, 0.377471923828125, 0.4142913818359375, 0.45111083984375, 0.4879302978515625, 0.524749755859375, 0.5615692138671875, 0.598388671875, 0.6352081298828125, 0.672027587890625, 0.7088470458984375, 0.74566650390625, 0.7824859619140625, 0.819305419921875, 0.8561248779296875, 0.8929443359375, 0.9297637939453125, 0.966583251953125, 1.0034027099609375, 1.04022216796875, 1.0770416259765625, 1.113861083984375, 1.1506805419921875, 1.1875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 3.0, 16.0, 21.0, 30.0, 55.0, 87.0, 148.0, 264.0, 126.0, 83.0, 54.0, 28.0, 22.0, 21.0, 11.0, 6.0, 6.0, 2.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-16.689308166503906, -16.253013610839844, -15.816718101501465, -15.380422592163086, -14.944127082824707, -14.507831573486328, -14.071537017822266, -13.635241508483887, -13.198945999145508, -12.762650489807129, -12.326355934143066, -11.890060424804688, -11.453764915466309, -11.01746940612793, -10.581174850463867, -10.144879341125488, -9.70858383178711, -9.27228832244873, -8.835993766784668, -8.399698257446289, -7.96340274810791, -7.5271077156066895, -7.090812683105469, -6.65451717376709, -6.218222618103027, -5.781927585601807, -5.345632076263428, -4.909337043762207, -4.473041534423828, -4.036746501922607, -3.6004512310028076, -3.164155960083008, -2.727860450744629, -2.291565179824829, -1.8552699089050293, -1.418974757194519, -0.9826794862747192, -0.546384334564209, -0.11008906364440918, 0.3262062072753906, 0.7625014781951904, 1.1987967491149902, 1.63509202003479, 2.07138729095459, 2.5076823234558105, 2.9439775943756104, 3.38027286529541, 3.81656813621521, 4.25286340713501, 4.6891584396362305, 5.125453948974609, 5.56174898147583, 5.998044490814209, 6.43433952331543, 6.870635032653809, 7.306930065155029, 7.74322509765625, 8.179520606994629, 8.615815162658691, 9.05211067199707, 9.48840618133545, 9.924701690673828, 10.36099624633789, 10.79729175567627, 11.233587265014648]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 3.0, 6.0, 5.0, 8.0, 6.0, 10.0, 10.0, 11.0, 15.0, 31.0, 15.0, 28.0, 23.0, 23.0, 36.0, 42.0, 45.0, 54.0, 60.0, 116.0, 93.0, 49.0, 44.0, 39.0, 30.0, 27.0, 28.0, 31.0, 22.0, 13.0, 8.0, 12.0, 14.0, 14.0, 8.0, 11.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0], "bins": [-13.936079025268555, -13.544151306152344, -13.152223587036133, -12.760295867919922, -12.368367195129395, -11.976439476013184, -11.584511756896973, -11.192584037780762, -10.800655364990234, -10.408727645874023, -10.016799926757812, -9.624872207641602, -9.232943534851074, -8.841015815734863, -8.449088096618652, -8.057160377502441, -7.6652326583862305, -7.2733049392700195, -6.88137674331665, -6.4894490242004395, -6.09752082824707, -5.705593109130859, -5.313665390014648, -4.9217376708984375, -4.529809474945068, -4.137881755828857, -3.7459535598754883, -3.3540258407592773, -2.9620978832244873, -2.5701699256896973, -2.1782422065734863, -1.7863142490386963, -1.3943853378295898, -1.0024573802947998, -0.6105295419692993, -0.21860170364379883, 0.1733262538909912, 0.5652542114257812, 0.9571819305419922, 1.3491098880767822, 1.7410378456115723, 2.1329658031463623, 2.5248937606811523, 2.9168214797973633, 3.3087494373321533, 3.7006773948669434, 4.092605113983154, 4.484533309936523, 4.876461029052734, 5.268388748168945, 5.6603169441223145, 6.052244663238525, 6.4441728591918945, 6.8361005783081055, 7.228028297424316, 7.619956016540527, 8.011884689331055, 8.403812408447266, 8.795740127563477, 9.187667846679688, 9.579596519470215, 9.971524238586426, 10.363451957702637, 10.755379676818848, 11.147307395935059]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 6.0, 8.0, 18.0, 14.0, 27.0, 27.0, 52.0, 73.0, 123.0, 190.0, 335.0, 597.0, 1075.0, 2230.0, 5053.0, 14265.0, 58412.0, 451304.0, 2717467.0, 816972.0, 94100.0, 19588.0, 6541.0, 2811.0, 1307.0, 659.0, 368.0, 227.0, 137.0, 82.0, 56.0, 57.0, 34.0, 20.0, 17.0, 8.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.111328125, -1.073822021484375, -1.03631591796875, -0.998809814453125, -0.9613037109375, -0.923797607421875, -0.88629150390625, -0.848785400390625, -0.811279296875, -0.773773193359375, -0.73626708984375, -0.698760986328125, -0.6612548828125, -0.623748779296875, -0.58624267578125, -0.548736572265625, -0.51123046875, -0.473724365234375, -0.43621826171875, -0.398712158203125, -0.3612060546875, -0.323699951171875, -0.28619384765625, -0.248687744140625, -0.211181640625, -0.173675537109375, -0.13616943359375, -0.098663330078125, -0.0611572265625, -0.023651123046875, 0.01385498046875, 0.051361083984375, 0.0888671875, 0.126373291015625, 0.16387939453125, 0.201385498046875, 0.2388916015625, 0.276397705078125, 0.31390380859375, 0.351409912109375, 0.388916015625, 0.426422119140625, 0.46392822265625, 0.501434326171875, 0.5389404296875, 0.576446533203125, 0.61395263671875, 0.651458740234375, 0.68896484375, 0.726470947265625, 0.76397705078125, 0.801483154296875, 0.8389892578125, 0.876495361328125, 0.91400146484375, 0.951507568359375, 0.989013671875, 1.026519775390625, 1.06402587890625, 1.101531982421875, 1.1390380859375, 1.176544189453125, 1.21405029296875, 1.251556396484375, 1.2890625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 3.0, 8.0, 14.0, 11.0, 14.0, 13.0, 17.0, 22.0, 17.0, 25.0, 33.0, 24.0, 34.0, 36.0, 45.0, 40.0, 28.0, 47.0, 52.0, 53.0, 40.0, 33.0, 37.0, 39.0, 39.0, 34.0, 39.0, 35.0, 24.0, 26.0, 23.0, 25.0, 17.0, 9.0, 7.0, 5.0, 7.0, 7.0, 3.0, 9.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0], "bins": [-0.814453125, -0.7899246215820312, -0.7653961181640625, -0.7408676147460938, -0.716339111328125, -0.6918106079101562, -0.6672821044921875, -0.6427536010742188, -0.61822509765625, -0.5936965942382812, -0.5691680908203125, -0.5446395874023438, -0.520111083984375, -0.49558258056640625, -0.4710540771484375, -0.44652557373046875, -0.4219970703125, -0.39746856689453125, -0.3729400634765625, -0.34841156005859375, -0.323883056640625, -0.29935455322265625, -0.2748260498046875, -0.25029754638671875, -0.22576904296875, -0.20124053955078125, -0.1767120361328125, -0.15218353271484375, -0.127655029296875, -0.10312652587890625, -0.0785980224609375, -0.05406951904296875, -0.029541015625, -0.00501251220703125, 0.0195159912109375, 0.04404449462890625, 0.068572998046875, 0.09310150146484375, 0.1176300048828125, 0.14215850830078125, 0.16668701171875, 0.19121551513671875, 0.2157440185546875, 0.24027252197265625, 0.264801025390625, 0.28932952880859375, 0.3138580322265625, 0.33838653564453125, 0.3629150390625, 0.38744354248046875, 0.4119720458984375, 0.43650054931640625, 0.461029052734375, 0.48555755615234375, 0.5100860595703125, 0.5346145629882812, 0.55914306640625, 0.5836715698242188, 0.6082000732421875, 0.6327285766601562, 0.657257080078125, 0.6817855834960938, 0.7063140869140625, 0.7308425903320312, 0.75537109375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 0.0, 4.0, 4.0, 3.0, 2.0, 12.0, 7.0, 12.0, 29.0, 34.0, 42.0, 79.0, 161.0, 294.0, 664.0, 2158.0, 7947.0, 48523.0, 2216296.0, 1861102.0, 45454.0, 7820.0, 2184.0, 734.0, 319.0, 137.0, 85.0, 46.0, 45.0, 25.0, 21.0, 17.0, 7.0, 6.0, 2.0, 1.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.484375, -2.4090576171875, -2.333740234375, -2.2584228515625, -2.18310546875, -2.1077880859375, -2.032470703125, -1.9571533203125, -1.8818359375, -1.8065185546875, -1.731201171875, -1.6558837890625, -1.58056640625, -1.5052490234375, -1.429931640625, -1.3546142578125, -1.279296875, -1.2039794921875, -1.128662109375, -1.0533447265625, -0.97802734375, -0.9027099609375, -0.827392578125, -0.7520751953125, -0.6767578125, -0.6014404296875, -0.526123046875, -0.4508056640625, -0.37548828125, -0.3001708984375, -0.224853515625, -0.1495361328125, -0.07421875, 0.0010986328125, 0.076416015625, 0.1517333984375, 0.22705078125, 0.3023681640625, 0.377685546875, 0.4530029296875, 0.5283203125, 0.6036376953125, 0.678955078125, 0.7542724609375, 0.82958984375, 0.9049072265625, 0.980224609375, 1.0555419921875, 1.130859375, 1.2061767578125, 1.281494140625, 1.3568115234375, 1.43212890625, 1.5074462890625, 1.582763671875, 1.6580810546875, 1.7333984375, 1.8087158203125, 1.884033203125, 1.9593505859375, 2.03466796875, 2.1099853515625, 2.185302734375, 2.2606201171875, 2.3359375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 6.0, 0.0, 3.0, 6.0, 6.0, 11.0, 18.0, 24.0, 39.0, 57.0, 96.0, 144.0, 281.0, 598.0, 1003.0, 839.0, 392.0, 218.0, 119.0, 74.0, 35.0, 22.0, 23.0, 21.0, 9.0, 7.0, 8.0, 7.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.544921875, -2.475738525390625, -2.40655517578125, -2.337371826171875, -2.2681884765625, -2.199005126953125, -2.12982177734375, -2.060638427734375, -1.991455078125, -1.922271728515625, -1.85308837890625, -1.783905029296875, -1.7147216796875, -1.645538330078125, -1.57635498046875, -1.507171630859375, -1.43798828125, -1.368804931640625, -1.29962158203125, -1.230438232421875, -1.1612548828125, -1.092071533203125, -1.02288818359375, -0.953704833984375, -0.884521484375, -0.815338134765625, -0.74615478515625, -0.676971435546875, -0.6077880859375, -0.538604736328125, -0.46942138671875, -0.400238037109375, -0.3310546875, -0.261871337890625, -0.19268798828125, -0.123504638671875, -0.0543212890625, 0.014862060546875, 0.08404541015625, 0.153228759765625, 0.222412109375, 0.291595458984375, 0.36077880859375, 0.429962158203125, 0.4991455078125, 0.568328857421875, 0.63751220703125, 0.706695556640625, 0.77587890625, 0.845062255859375, 0.91424560546875, 0.983428955078125, 1.0526123046875, 1.121795654296875, 1.19097900390625, 1.260162353515625, 1.329345703125, 1.398529052734375, 1.46771240234375, 1.536895751953125, 1.6060791015625, 1.675262451171875, 1.74444580078125, 1.813629150390625, 1.8828125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 43.0, 99.0, 284.0, 321.0, 158.0, 40.0, 21.0, 9.0, 11.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-36.12636947631836, -35.36076354980469, -34.59516143798828, -33.829559326171875, -33.0639533996582, -32.29834747314453, -31.532745361328125, -30.767141342163086, -30.001537322998047, -29.235933303833008, -28.47032928466797, -27.70472526550293, -26.93912124633789, -26.17351722717285, -25.407913208007812, -24.642309188842773, -23.876705169677734, -23.111101150512695, -22.345497131347656, -21.579893112182617, -20.814289093017578, -20.04868507385254, -19.2830810546875, -18.51747703552246, -17.751873016357422, -16.986268997192383, -16.220664978027344, -15.455060958862305, -14.689456939697266, -13.923852920532227, -13.158248901367188, -12.392644882202148, -11.62704086303711, -10.86143684387207, -10.095832824707031, -9.330228805541992, -8.564624786376953, -7.799020767211914, -7.033416748046875, -6.267812728881836, -5.502208709716797, -4.736604690551758, -3.9710006713867188, -3.2053966522216797, -2.4397926330566406, -1.6741886138916016, -0.9085845947265625, -0.14298057556152344, 0.6226234436035156, 1.3882274627685547, 2.1538314819335938, 2.919435501098633, 3.685039520263672, 4.450643539428711, 5.21624755859375, 5.981851577758789, 6.747455596923828, 7.513059616088867, 8.278663635253906, 9.044267654418945, 9.809871673583984, 10.575475692749023, 11.341079711914062, 12.106683731079102, 12.87228775024414]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 3.0, 4.0, 6.0, 6.0, 6.0, 9.0, 15.0, 11.0, 11.0, 16.0, 18.0, 24.0, 18.0, 28.0, 37.0, 39.0, 48.0, 31.0, 41.0, 48.0, 51.0, 51.0, 54.0, 45.0, 43.0, 38.0, 44.0, 31.0, 31.0, 34.0, 20.0, 15.0, 25.0, 22.0, 10.0, 7.0, 14.0, 10.0, 9.0, 7.0, 3.0, 3.0, 5.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0], "bins": [-6.457266807556152, -6.251025199890137, -6.044783592224121, -5.838541507720947, -5.632299900054932, -5.426058292388916, -5.219816207885742, -5.013574600219727, -4.807332992553711, -4.601091384887695, -4.39484977722168, -4.188607692718506, -3.9823660850524902, -3.7761244773864746, -3.56988263130188, -3.363640785217285, -3.1573991775512695, -2.951157569885254, -2.744915723800659, -2.5386738777160645, -2.332432270050049, -2.126190662384033, -1.9199488162994385, -1.7137070894241333, -1.5074653625488281, -1.301223635673523, -1.0949819087982178, -0.8887401819229126, -0.6824984550476074, -0.47625672817230225, -0.27001500129699707, -0.0637732744216919, 0.14246892929077148, 0.34871065616607666, 0.5549523830413818, 0.761194109916687, 0.9674358367919922, 1.1736775636672974, 1.3799192905426025, 1.5861610174179077, 1.792402744293213, 1.998644471168518, 2.2048861980438232, 2.411128044128418, 2.6173696517944336, 2.823611259460449, 3.029853105545044, 3.2360949516296387, 3.4423365592956543, 3.64857816696167, 3.8548200130462646, 4.061061859130859, 4.267303466796875, 4.473545074462891, 4.679786682128906, 4.88602876663208, 5.092270374298096, 5.298511981964111, 5.504754066467285, 5.710995674133301, 5.917237281799316, 6.123478889465332, 6.329720497131348, 6.5359625816345215, 6.742204189300537]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 7.0, 7.0, 13.0, 20.0, 26.0, 32.0, 61.0, 102.0, 111.0, 174.0, 250.0, 370.0, 531.0, 898.0, 1415.0, 2227.0, 3727.0, 6667.0, 12690.0, 27454.0, 67152.0, 187711.0, 420290.0, 190945.0, 68009.0, 28087.0, 12918.0, 6560.0, 3861.0, 2214.0, 1353.0, 848.0, 615.0, 367.0, 266.0, 198.0, 120.0, 82.0, 66.0, 32.0, 35.0, 14.0, 9.0, 8.0, 5.0, 3.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.59375, -1.5431671142578125, -1.492584228515625, -1.4420013427734375, -1.39141845703125, -1.3408355712890625, -1.290252685546875, -1.2396697998046875, -1.1890869140625, -1.1385040283203125, -1.087921142578125, -1.0373382568359375, -0.98675537109375, -0.9361724853515625, -0.885589599609375, -0.8350067138671875, -0.784423828125, -0.7338409423828125, -0.683258056640625, -0.6326751708984375, -0.58209228515625, -0.5315093994140625, -0.480926513671875, -0.4303436279296875, -0.3797607421875, -0.3291778564453125, -0.278594970703125, -0.2280120849609375, -0.17742919921875, -0.1268463134765625, -0.076263427734375, -0.0256805419921875, 0.02490234375, 0.0754852294921875, 0.126068115234375, 0.1766510009765625, 0.22723388671875, 0.2778167724609375, 0.328399658203125, 0.3789825439453125, 0.4295654296875, 0.4801483154296875, 0.530731201171875, 0.5813140869140625, 0.63189697265625, 0.6824798583984375, 0.733062744140625, 0.7836456298828125, 0.834228515625, 0.8848114013671875, 0.935394287109375, 0.9859771728515625, 1.03656005859375, 1.0871429443359375, 1.137725830078125, 1.1883087158203125, 1.2388916015625, 1.2894744873046875, 1.340057373046875, 1.3906402587890625, 1.44122314453125, 1.4918060302734375, 1.542388916015625, 1.5929718017578125, 1.6435546875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 2.0, 5.0, 6.0, 8.0, 5.0, 8.0, 15.0, 13.0, 20.0, 17.0, 25.0, 22.0, 34.0, 29.0, 33.0, 39.0, 30.0, 34.0, 55.0, 50.0, 39.0, 53.0, 45.0, 38.0, 37.0, 33.0, 40.0, 36.0, 35.0, 35.0, 27.0, 27.0, 22.0, 20.0, 21.0, 11.0, 7.0, 6.0, 7.0, 1.0, 8.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.7744140625, -0.7486953735351562, -0.7229766845703125, -0.6972579956054688, -0.671539306640625, -0.6458206176757812, -0.6201019287109375, -0.5943832397460938, -0.56866455078125, -0.5429458618164062, -0.5172271728515625, -0.49150848388671875, -0.465789794921875, -0.44007110595703125, -0.4143524169921875, -0.38863372802734375, -0.3629150390625, -0.33719635009765625, -0.3114776611328125, -0.28575897216796875, -0.260040283203125, -0.23432159423828125, -0.2086029052734375, -0.18288421630859375, -0.15716552734375, -0.13144683837890625, -0.1057281494140625, -0.08000946044921875, -0.054290771484375, -0.02857208251953125, -0.0028533935546875, 0.02286529541015625, 0.048583984375, 0.07430267333984375, 0.1000213623046875, 0.12574005126953125, 0.151458740234375, 0.17717742919921875, 0.2028961181640625, 0.22861480712890625, 0.25433349609375, 0.28005218505859375, 0.3057708740234375, 0.33148956298828125, 0.357208251953125, 0.38292694091796875, 0.4086456298828125, 0.43436431884765625, 0.4600830078125, 0.48580169677734375, 0.5115203857421875, 0.5372390747070312, 0.562957763671875, 0.5886764526367188, 0.6143951416015625, 0.6401138305664062, 0.66583251953125, 0.6915512084960938, 0.7172698974609375, 0.7429885864257812, 0.768707275390625, 0.7944259643554688, 0.8201446533203125, 0.8458633422851562, 0.87158203125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 1.0, 1.0, 1.0, 5.0, 11.0, 10.0, 11.0, 20.0, 20.0, 16.0, 22.0, 47.0, 54.0, 78.0, 110.0, 140.0, 189.0, 269.0, 370.0, 616.0, 1104.0, 2334.0, 5411.0, 17139.0, 78631.0, 747940.0, 152626.0, 26924.0, 7830.0, 2967.0, 1407.0, 767.0, 485.0, 282.0, 171.0, 140.0, 95.0, 76.0, 47.0, 44.0, 44.0, 25.0, 16.0, 15.0, 12.0, 7.0, 9.0, 5.0, 8.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-2.564453125, -2.490478515625, -2.41650390625, -2.342529296875, -2.2685546875, -2.194580078125, -2.12060546875, -2.046630859375, -1.97265625, -1.898681640625, -1.82470703125, -1.750732421875, -1.6767578125, -1.602783203125, -1.52880859375, -1.454833984375, -1.380859375, -1.306884765625, -1.23291015625, -1.158935546875, -1.0849609375, -1.010986328125, -0.93701171875, -0.863037109375, -0.7890625, -0.715087890625, -0.64111328125, -0.567138671875, -0.4931640625, -0.419189453125, -0.34521484375, -0.271240234375, -0.197265625, -0.123291015625, -0.04931640625, 0.024658203125, 0.0986328125, 0.172607421875, 0.24658203125, 0.320556640625, 0.39453125, 0.468505859375, 0.54248046875, 0.616455078125, 0.6904296875, 0.764404296875, 0.83837890625, 0.912353515625, 0.986328125, 1.060302734375, 1.13427734375, 1.208251953125, 1.2822265625, 1.356201171875, 1.43017578125, 1.504150390625, 1.578125, 1.652099609375, 1.72607421875, 1.800048828125, 1.8740234375, 1.947998046875, 2.02197265625, 2.095947265625, 2.169921875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 7.0, 10.0, 5.0, 8.0, 14.0, 10.0, 22.0, 24.0, 17.0, 22.0, 22.0, 32.0, 30.0, 32.0, 42.0, 40.0, 45.0, 63.0, 49.0, 63.0, 55.0, 46.0, 43.0, 38.0, 33.0, 25.0, 25.0, 20.0, 24.0, 23.0, 23.0, 10.0, 10.0, 12.0, 8.0, 18.0, 5.0, 8.0, 5.0, 1.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.078125, -2.9903564453125, -2.902587890625, -2.8148193359375, -2.72705078125, -2.6392822265625, -2.551513671875, -2.4637451171875, -2.3759765625, -2.2882080078125, -2.200439453125, -2.1126708984375, -2.02490234375, -1.9371337890625, -1.849365234375, -1.7615966796875, -1.673828125, -1.5860595703125, -1.498291015625, -1.4105224609375, -1.32275390625, -1.2349853515625, -1.147216796875, -1.0594482421875, -0.9716796875, -0.8839111328125, -0.796142578125, -0.7083740234375, -0.62060546875, -0.5328369140625, -0.445068359375, -0.3572998046875, -0.26953125, -0.1817626953125, -0.093994140625, -0.0062255859375, 0.08154296875, 0.1693115234375, 0.257080078125, 0.3448486328125, 0.4326171875, 0.5203857421875, 0.608154296875, 0.6959228515625, 0.78369140625, 0.8714599609375, 0.959228515625, 1.0469970703125, 1.134765625, 1.2225341796875, 1.310302734375, 1.3980712890625, 1.48583984375, 1.5736083984375, 1.661376953125, 1.7491455078125, 1.8369140625, 1.9246826171875, 2.012451171875, 2.1002197265625, 2.18798828125, 2.2757568359375, 2.363525390625, 2.4512939453125, 2.5390625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 5.0, 10.0, 7.0, 3.0, 7.0, 19.0, 20.0, 23.0, 29.0, 59.0, 95.0, 135.0, 238.0, 380.0, 730.0, 1425.0, 3273.0, 9755.0, 39766.0, 282590.0, 639683.0, 51249.0, 11790.0, 3851.0, 1565.0, 795.0, 376.0, 239.0, 149.0, 97.0, 47.0, 34.0, 30.0, 19.0, 18.0, 8.0, 7.0, 11.0, 5.0, 4.0, 4.0, 5.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61767578125, -0.598419189453125, -0.57916259765625, -0.559906005859375, -0.5406494140625, -0.521392822265625, -0.50213623046875, -0.482879638671875, -0.463623046875, -0.444366455078125, -0.42510986328125, -0.405853271484375, -0.3865966796875, -0.367340087890625, -0.34808349609375, -0.328826904296875, -0.3095703125, -0.290313720703125, -0.27105712890625, -0.251800537109375, -0.2325439453125, -0.213287353515625, -0.19403076171875, -0.174774169921875, -0.155517578125, -0.136260986328125, -0.11700439453125, -0.097747802734375, -0.0784912109375, -0.059234619140625, -0.03997802734375, -0.020721435546875, -0.00146484375, 0.017791748046875, 0.03704833984375, 0.056304931640625, 0.0755615234375, 0.094818115234375, 0.11407470703125, 0.133331298828125, 0.152587890625, 0.171844482421875, 0.19110107421875, 0.210357666015625, 0.2296142578125, 0.248870849609375, 0.26812744140625, 0.287384033203125, 0.306640625, 0.325897216796875, 0.34515380859375, 0.364410400390625, 0.3836669921875, 0.402923583984375, 0.42218017578125, 0.441436767578125, 0.460693359375, 0.479949951171875, 0.49920654296875, 0.518463134765625, 0.5377197265625, 0.556976318359375, 0.57623291015625, 0.595489501953125, 0.61474609375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 7.0, 7.0, 11.0, 14.0, 14.0, 28.0, 35.0, 61.0, 92.0, 124.0, 145.0, 149.0, 88.0, 62.0, 50.0, 34.0, 29.0, 11.0, 8.0, 12.0, 5.0, 2.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00028777122497558594, -0.00028052181005477905, -0.00027327239513397217, -0.0002660229802131653, -0.0002587735652923584, -0.0002515241503715515, -0.00024427473545074463, -0.00023702532052993774, -0.00022977590560913086, -0.00022252649068832397, -0.0002152770757675171, -0.0002080276608467102, -0.00020077824592590332, -0.00019352883100509644, -0.00018627941608428955, -0.00017903000116348267, -0.00017178058624267578, -0.0001645311713218689, -0.000157281756401062, -0.00015003234148025513, -0.00014278292655944824, -0.00013553351163864136, -0.00012828409671783447, -0.00012103468179702759, -0.0001137852668762207, -0.00010653585195541382, -9.928643703460693e-05, -9.203702211380005e-05, -8.478760719299316e-05, -7.753819227218628e-05, -7.02887773513794e-05, -6.303936243057251e-05, -5.5789947509765625e-05, -4.854053258895874e-05, -4.1291117668151855e-05, -3.404170274734497e-05, -2.6792287826538086e-05, -1.95428729057312e-05, -1.2293457984924316e-05, -5.044043064117432e-06, 2.205371856689453e-06, 9.454786777496338e-06, 1.6704201698303223e-05, 2.3953616619110107e-05, 3.120303153991699e-05, 3.845244646072388e-05, 4.570186138153076e-05, 5.2951276302337646e-05, 6.020069122314453e-05, 6.745010614395142e-05, 7.46995210647583e-05, 8.194893598556519e-05, 8.919835090637207e-05, 9.644776582717896e-05, 0.00010369718074798584, 0.00011094659566879272, 0.00011819601058959961, 0.0001254454255104065, 0.00013269484043121338, 0.00013994425535202026, 0.00014719367027282715, 0.00015444308519363403, 0.00016169250011444092, 0.0001689419150352478, 0.0001761913299560547]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 0.0, 5.0, 3.0, 7.0, 10.0, 8.0, 15.0, 8.0, 30.0, 35.0, 49.0, 62.0, 89.0, 128.0, 222.0, 364.0, 635.0, 1458.0, 3490.0, 10073.0, 43685.0, 429673.0, 497415.0, 44367.0, 10202.0, 3483.0, 1340.0, 649.0, 380.0, 216.0, 126.0, 96.0, 58.0, 49.0, 30.0, 23.0, 21.0, 11.0, 13.0, 13.0, 5.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.5947265625, -0.5767059326171875, -0.558685302734375, -0.5406646728515625, -0.52264404296875, -0.5046234130859375, -0.486602783203125, -0.4685821533203125, -0.4505615234375, -0.4325408935546875, -0.414520263671875, -0.3964996337890625, -0.37847900390625, -0.3604583740234375, -0.342437744140625, -0.3244171142578125, -0.306396484375, -0.2883758544921875, -0.270355224609375, -0.2523345947265625, -0.23431396484375, -0.2162933349609375, -0.198272705078125, -0.1802520751953125, -0.1622314453125, -0.1442108154296875, -0.126190185546875, -0.1081695556640625, -0.09014892578125, -0.0721282958984375, -0.054107666015625, -0.0360870361328125, -0.01806640625, -4.57763671875e-05, 0.017974853515625, 0.0359954833984375, 0.05401611328125, 0.0720367431640625, 0.090057373046875, 0.1080780029296875, 0.1260986328125, 0.1441192626953125, 0.162139892578125, 0.1801605224609375, 0.19818115234375, 0.2162017822265625, 0.234222412109375, 0.2522430419921875, 0.270263671875, 0.2882843017578125, 0.306304931640625, 0.3243255615234375, 0.34234619140625, 0.3603668212890625, 0.378387451171875, 0.3964080810546875, 0.4144287109375, 0.4324493408203125, 0.450469970703125, 0.4684906005859375, 0.48651123046875, 0.5045318603515625, 0.522552490234375, 0.5405731201171875, 0.55859375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 7.0, 5.0, 1.0, 8.0, 13.0, 12.0, 18.0, 15.0, 16.0, 26.0, 32.0, 37.0, 43.0, 55.0, 53.0, 59.0, 74.0, 60.0, 63.0, 67.0, 64.0, 38.0, 39.0, 33.0, 31.0, 18.0, 23.0, 14.0, 9.0, 12.0, 9.0, 14.0, 3.0, 4.0, 5.0, 0.0, 5.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.4462890625, -0.43256378173828125, -0.4188385009765625, -0.40511322021484375, -0.391387939453125, -0.37766265869140625, -0.3639373779296875, -0.35021209716796875, -0.33648681640625, -0.32276153564453125, -0.3090362548828125, -0.29531097412109375, -0.281585693359375, -0.26786041259765625, -0.2541351318359375, -0.24040985107421875, -0.2266845703125, -0.21295928955078125, -0.1992340087890625, -0.18550872802734375, -0.171783447265625, -0.15805816650390625, -0.1443328857421875, -0.13060760498046875, -0.11688232421875, -0.10315704345703125, -0.0894317626953125, -0.07570648193359375, -0.061981201171875, -0.04825592041015625, -0.0345306396484375, -0.02080535888671875, -0.007080078125, 0.00664520263671875, 0.0203704833984375, 0.03409576416015625, 0.047821044921875, 0.06154632568359375, 0.0752716064453125, 0.08899688720703125, 0.10272216796875, 0.11644744873046875, 0.1301727294921875, 0.14389801025390625, 0.157623291015625, 0.17134857177734375, 0.1850738525390625, 0.19879913330078125, 0.2125244140625, 0.22624969482421875, 0.2399749755859375, 0.25370025634765625, 0.267425537109375, 0.28115081787109375, 0.2948760986328125, 0.30860137939453125, 0.32232666015625, 0.33605194091796875, 0.3497772216796875, 0.36350250244140625, 0.377227783203125, 0.39095306396484375, 0.4046783447265625, 0.41840362548828125, 0.43212890625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 11.0, 11.0, 23.0, 49.0, 97.0, 331.0, 227.0, 112.0, 53.0, 39.0, 25.0, 12.0, 7.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.293344497680664, -12.657795906066895, -12.022247314453125, -11.386699676513672, -10.751151084899902, -10.115602493286133, -9.48005485534668, -8.84450626373291, -8.20895767211914, -7.573409080505371, -6.93786096572876, -6.302312850952148, -5.666764259338379, -5.031215667724609, -4.395667552947998, -3.7601194381713867, -3.124570846557617, -2.4890224933624268, -1.8534741401672363, -1.217925786972046, -0.5823774337768555, 0.05317091941833496, 0.6887192726135254, 1.3242673873901367, 1.9598159790039062, 2.5953643321990967, 3.230912685394287, 3.8664610385894775, 4.502009391784668, 5.1375579833984375, 5.773106098175049, 6.40865421295166, 7.0442047119140625, 7.679753303527832, 8.315301895141602, 8.950849533081055, 9.586398124694824, 10.221946716308594, 10.857494354248047, 11.493042945861816, 12.128591537475586, 12.764140129089355, 13.399688720703125, 14.035236358642578, 14.670784950256348, 15.306333541870117, 15.94188117980957, 16.577430725097656, 17.21297836303711, 17.848526000976562, 18.48407554626465, 19.1196231842041, 19.755172729492188, 20.39072036743164, 21.026268005371094, 21.661815643310547, 22.297365188598633, 22.932912826538086, 23.568462371826172, 24.204010009765625, 24.839557647705078, 25.475107192993164, 26.110654830932617, 26.746204376220703, 27.381752014160156]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 0.0, 2.0, 0.0, 4.0, 7.0, 8.0, 9.0, 7.0, 14.0, 13.0, 18.0, 12.0, 19.0, 19.0, 21.0, 20.0, 25.0, 30.0, 39.0, 35.0, 39.0, 68.0, 86.0, 128.0, 88.0, 42.0, 33.0, 28.0, 23.0, 14.0, 23.0, 17.0, 17.0, 19.0, 11.0, 9.0, 11.0, 9.0, 7.0, 5.0, 4.0, 2.0, 4.0, 5.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-9.808591842651367, -9.52204418182373, -9.235495567321777, -8.94894790649414, -8.662399291992188, -8.37585163116455, -8.089303970336914, -7.802755832672119, -7.516207695007324, -7.229659557342529, -6.943111419677734, -6.656563758850098, -6.370015621185303, -6.083467483520508, -5.796919822692871, -5.510371685028076, -5.223823547363281, -4.937275409698486, -4.650727272033691, -4.364179611206055, -4.07763147354126, -3.791083335876465, -3.504535436630249, -3.217987537384033, -2.9314393997192383, -2.6448912620544434, -2.3583433628082275, -2.0717954635620117, -1.7852473258972168, -1.4986993074417114, -1.212151288986206, -0.9256033897399902, -0.6390552520751953, -0.35250723361968994, -0.06595921516418457, 0.2205888032913208, 0.5071368217468262, 0.7936848402023315, 1.080232858657837, 1.3667807579040527, 1.6533288955688477, 1.939876914024353, 2.2264249324798584, 2.512972831726074, 2.799520969390869, 3.086069107055664, 3.37261700630188, 3.6591649055480957, 3.9457130432128906, 4.2322611808776855, 4.5188093185424805, 4.805356979370117, 5.091905117034912, 5.378453254699707, 5.665000915527344, 5.951549053192139, 6.238097190856934, 6.5246453285217285, 6.811193466186523, 7.09774112701416, 7.384289264678955, 7.67083740234375, 7.957385063171387, 8.243932723999023, 8.530481338500977]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 7.0, 8.0, 18.0, 31.0, 25.0, 51.0, 79.0, 107.0, 173.0, 266.0, 458.0, 827.0, 1513.0, 3283.0, 8334.0, 27599.0, 136975.0, 1365623.0, 2345134.0, 244145.0, 39880.0, 11158.0, 4269.0, 1904.0, 968.0, 558.0, 345.0, 178.0, 135.0, 69.0, 44.0, 38.0, 25.0, 18.0, 16.0, 11.0, 6.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.046875, -1.98114013671875, -1.9154052734375, -1.84967041015625, -1.783935546875, -1.71820068359375, -1.6524658203125, -1.58673095703125, -1.52099609375, -1.45526123046875, -1.3895263671875, -1.32379150390625, -1.258056640625, -1.19232177734375, -1.1265869140625, -1.06085205078125, -0.9951171875, -0.92938232421875, -0.8636474609375, -0.79791259765625, -0.732177734375, -0.66644287109375, -0.6007080078125, -0.53497314453125, -0.46923828125, -0.40350341796875, -0.3377685546875, -0.27203369140625, -0.206298828125, -0.14056396484375, -0.0748291015625, -0.00909423828125, 0.056640625, 0.12237548828125, 0.1881103515625, 0.25384521484375, 0.319580078125, 0.38531494140625, 0.4510498046875, 0.51678466796875, 0.58251953125, 0.64825439453125, 0.7139892578125, 0.77972412109375, 0.845458984375, 0.91119384765625, 0.9769287109375, 1.04266357421875, 1.1083984375, 1.17413330078125, 1.2398681640625, 1.30560302734375, 1.371337890625, 1.43707275390625, 1.5028076171875, 1.56854248046875, 1.63427734375, 1.70001220703125, 1.7657470703125, 1.83148193359375, 1.897216796875, 1.96295166015625, 2.0286865234375, 2.09442138671875, 2.16015625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 6.0, 5.0, 8.0, 15.0, 9.0, 15.0, 23.0, 26.0, 29.0, 22.0, 26.0, 51.0, 41.0, 38.0, 43.0, 32.0, 53.0, 65.0, 54.0, 52.0, 37.0, 42.0, 35.0, 30.0, 35.0, 34.0, 28.0, 25.0, 23.0, 24.0, 16.0, 15.0, 9.0, 6.0, 9.0, 4.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.767578125, -0.7418289184570312, -0.7160797119140625, -0.6903305053710938, -0.664581298828125, -0.6388320922851562, -0.6130828857421875, -0.5873336791992188, -0.56158447265625, -0.5358352661132812, -0.5100860595703125, -0.48433685302734375, -0.458587646484375, -0.43283843994140625, -0.4070892333984375, -0.38134002685546875, -0.3555908203125, -0.32984161376953125, -0.3040924072265625, -0.27834320068359375, -0.252593994140625, -0.22684478759765625, -0.2010955810546875, -0.17534637451171875, -0.14959716796875, -0.12384796142578125, -0.0980987548828125, -0.07234954833984375, -0.046600341796875, -0.02085113525390625, 0.0048980712890625, 0.03064727783203125, 0.056396484375, 0.08214569091796875, 0.1078948974609375, 0.13364410400390625, 0.159393310546875, 0.18514251708984375, 0.2108917236328125, 0.23664093017578125, 0.26239013671875, 0.28813934326171875, 0.3138885498046875, 0.33963775634765625, 0.365386962890625, 0.39113616943359375, 0.4168853759765625, 0.44263458251953125, 0.4683837890625, 0.49413299560546875, 0.5198822021484375, 0.5456314086914062, 0.571380615234375, 0.5971298217773438, 0.6228790283203125, 0.6486282348632812, 0.67437744140625, 0.7001266479492188, 0.7258758544921875, 0.7516250610351562, 0.777374267578125, 0.8031234741210938, 0.8288726806640625, 0.8546218872070312, 0.88037109375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 8.0, 2.0, 6.0, 7.0, 12.0, 15.0, 16.0, 26.0, 38.0, 64.0, 90.0, 153.0, 259.0, 462.0, 959.0, 2372.0, 7865.0, 66454.0, 3787899.0, 305348.0, 15811.0, 3670.0, 1310.0, 615.0, 307.0, 175.0, 108.0, 75.0, 55.0, 40.0, 20.0, 15.0, 7.0, 6.0, 4.0, 2.0, 1.0, 4.0, 4.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0], "bins": [-5.1640625, -5.027099609375, -4.89013671875, -4.753173828125, -4.6162109375, -4.479248046875, -4.34228515625, -4.205322265625, -4.068359375, -3.931396484375, -3.79443359375, -3.657470703125, -3.5205078125, -3.383544921875, -3.24658203125, -3.109619140625, -2.97265625, -2.835693359375, -2.69873046875, -2.561767578125, -2.4248046875, -2.287841796875, -2.15087890625, -2.013916015625, -1.876953125, -1.739990234375, -1.60302734375, -1.466064453125, -1.3291015625, -1.192138671875, -1.05517578125, -0.918212890625, -0.78125, -0.644287109375, -0.50732421875, -0.370361328125, -0.2333984375, -0.096435546875, 0.04052734375, 0.177490234375, 0.314453125, 0.451416015625, 0.58837890625, 0.725341796875, 0.8623046875, 0.999267578125, 1.13623046875, 1.273193359375, 1.41015625, 1.547119140625, 1.68408203125, 1.821044921875, 1.9580078125, 2.094970703125, 2.23193359375, 2.368896484375, 2.505859375, 2.642822265625, 2.77978515625, 2.916748046875, 3.0537109375, 3.190673828125, 3.32763671875, 3.464599609375, 3.6015625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 5.0, 6.0, 7.0, 8.0, 18.0, 27.0, 26.0, 40.0, 68.0, 77.0, 143.0, 228.0, 392.0, 591.0, 825.0, 588.0, 332.0, 226.0, 153.0, 87.0, 82.0, 51.0, 35.0, 22.0, 7.0, 10.0, 12.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.712890625, -2.610626220703125, -2.50836181640625, -2.406097412109375, -2.3038330078125, -2.201568603515625, -2.09930419921875, -1.997039794921875, -1.894775390625, -1.792510986328125, -1.69024658203125, -1.587982177734375, -1.4857177734375, -1.383453369140625, -1.28118896484375, -1.178924560546875, -1.07666015625, -0.974395751953125, -0.87213134765625, -0.769866943359375, -0.6676025390625, -0.565338134765625, -0.46307373046875, -0.360809326171875, -0.258544921875, -0.156280517578125, -0.05401611328125, 0.048248291015625, 0.1505126953125, 0.252777099609375, 0.35504150390625, 0.457305908203125, 0.5595703125, 0.661834716796875, 0.76409912109375, 0.866363525390625, 0.9686279296875, 1.070892333984375, 1.17315673828125, 1.275421142578125, 1.377685546875, 1.479949951171875, 1.58221435546875, 1.684478759765625, 1.7867431640625, 1.889007568359375, 1.99127197265625, 2.093536376953125, 2.19580078125, 2.298065185546875, 2.40032958984375, 2.502593994140625, 2.6048583984375, 2.707122802734375, 2.80938720703125, 2.911651611328125, 3.013916015625, 3.116180419921875, 3.21844482421875, 3.320709228515625, 3.4229736328125, 3.525238037109375, 3.62750244140625, 3.729766845703125, 3.83203125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 8.0, 11.0, 16.0, 27.0, 33.0, 83.0, 151.0, 212.0, 198.0, 116.0, 52.0, 38.0, 18.0, 13.0, 7.0, 5.0, 0.0, 3.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.202171325683594, -34.131813049316406, -33.06145477294922, -31.99109649658203, -30.920738220214844, -29.850379943847656, -28.78002166748047, -27.70966339111328, -26.639305114746094, -25.568946838378906, -24.49858856201172, -23.42823028564453, -22.357872009277344, -21.287513732910156, -20.21715545654297, -19.14679718017578, -18.076440811157227, -17.00608253479004, -15.935724258422852, -14.865365982055664, -13.795007705688477, -12.724649429321289, -11.654292106628418, -10.58393383026123, -9.513575553894043, -8.443217277526855, -7.372859001159668, -6.302501201629639, -5.232142925262451, -4.161784648895264, -3.0914268493652344, -2.021068572998047, -0.9507102966308594, 0.11964786052703857, 1.1900060176849365, 2.260364055633545, 3.3307223320007324, 4.40108060836792, 5.471438407897949, 6.541796684265137, 7.612154960632324, 8.682513236999512, 9.7528715133667, 10.82322883605957, 11.893587112426758, 12.963945388793945, 14.034303665161133, 15.10466194152832, 16.175020217895508, 17.245378494262695, 18.315736770629883, 19.38609504699707, 20.456453323364258, 21.526811599731445, 22.59716796875, 23.667526245117188, 24.737884521484375, 25.808242797851562, 26.87860107421875, 27.948959350585938, 29.019317626953125, 30.089675903320312, 31.1600341796875, 32.23039245605469, 33.300750732421875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 6.0, 4.0, 7.0, 9.0, 6.0, 13.0, 15.0, 15.0, 18.0, 24.0, 20.0, 33.0, 32.0, 45.0, 35.0, 42.0, 48.0, 57.0, 58.0, 61.0, 60.0, 53.0, 46.0, 40.0, 43.0, 31.0, 37.0, 17.0, 22.0, 16.0, 28.0, 7.0, 17.0, 9.0, 7.0, 6.0, 9.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.340259552001953, -14.857845306396484, -14.375432014465332, -13.893017768859863, -13.410604476928711, -12.928190231323242, -12.445775985717773, -11.963362693786621, -11.480949401855469, -10.99853515625, -10.516121864318848, -10.033707618713379, -9.551294326782227, -9.068880081176758, -8.586465835571289, -8.104052543640137, -7.621638298034668, -7.139224529266357, -6.656810760498047, -6.174396514892578, -5.691983222961426, -5.209568977355957, -4.7271552085876465, -4.244741439819336, -3.7623276710510254, -3.279913902282715, -2.7975001335144043, -2.3150861263275146, -1.832672357559204, -1.3502585887908936, -0.8678445816040039, -0.38543081283569336, 0.0969839096069336, 0.5793977379798889, 1.0618115663528442, 1.5442254543304443, 2.026639223098755, 2.5090529918670654, 2.991466999053955, 3.4738807678222656, 3.956294536590576, 4.438708305358887, 4.921122074127197, 5.403535842895508, 5.885950088500977, 6.368363380432129, 6.850777626037598, 7.333191394805908, 7.815605163574219, 8.298019409179688, 8.78043270111084, 9.262846946716309, 9.745260238647461, 10.22767448425293, 10.710088729858398, 11.19250202178955, 11.674915313720703, 12.157329559326172, 12.639742851257324, 13.122157096862793, 13.604570388793945, 14.086984634399414, 14.569398880004883, 15.051812171936035, 15.534226417541504]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 7.0, 11.0, 11.0, 21.0, 35.0, 41.0, 52.0, 73.0, 111.0, 177.0, 244.0, 429.0, 655.0, 1116.0, 1935.0, 3375.0, 5853.0, 11200.0, 22545.0, 52054.0, 150481.0, 535166.0, 159386.0, 54057.0, 23466.0, 11501.0, 6023.0, 3445.0, 2039.0, 1147.0, 647.0, 422.0, 284.0, 183.0, 107.0, 81.0, 49.0, 31.0, 29.0, 19.0, 11.0, 10.0, 9.0, 2.0, 6.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 3.0], "bins": [-1.35546875, -1.315032958984375, -1.27459716796875, -1.234161376953125, -1.1937255859375, -1.153289794921875, -1.11285400390625, -1.072418212890625, -1.031982421875, -0.991546630859375, -0.95111083984375, -0.910675048828125, -0.8702392578125, -0.829803466796875, -0.78936767578125, -0.748931884765625, -0.70849609375, -0.668060302734375, -0.62762451171875, -0.587188720703125, -0.5467529296875, -0.506317138671875, -0.46588134765625, -0.425445556640625, -0.385009765625, -0.344573974609375, -0.30413818359375, -0.263702392578125, -0.2232666015625, -0.182830810546875, -0.14239501953125, -0.101959228515625, -0.0615234375, -0.021087646484375, 0.01934814453125, 0.059783935546875, 0.1002197265625, 0.140655517578125, 0.18109130859375, 0.221527099609375, 0.261962890625, 0.302398681640625, 0.34283447265625, 0.383270263671875, 0.4237060546875, 0.464141845703125, 0.50457763671875, 0.545013427734375, 0.58544921875, 0.625885009765625, 0.66632080078125, 0.706756591796875, 0.7471923828125, 0.787628173828125, 0.82806396484375, 0.868499755859375, 0.908935546875, 0.949371337890625, 0.98980712890625, 1.030242919921875, 1.0706787109375, 1.111114501953125, 1.15155029296875, 1.191986083984375, 1.232421875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 5.0, 9.0, 9.0, 15.0, 14.0, 14.0, 22.0, 18.0, 25.0, 30.0, 39.0, 39.0, 40.0, 50.0, 74.0, 49.0, 54.0, 72.0, 61.0, 51.0, 34.0, 51.0, 33.0, 27.0, 37.0, 30.0, 29.0, 20.0, 11.0, 14.0, 12.0, 7.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.193359375, -1.157928466796875, -1.12249755859375, -1.087066650390625, -1.0516357421875, -1.016204833984375, -0.98077392578125, -0.945343017578125, -0.909912109375, -0.874481201171875, -0.83905029296875, -0.803619384765625, -0.7681884765625, -0.732757568359375, -0.69732666015625, -0.661895751953125, -0.62646484375, -0.591033935546875, -0.55560302734375, -0.520172119140625, -0.4847412109375, -0.449310302734375, -0.41387939453125, -0.378448486328125, -0.343017578125, -0.307586669921875, -0.27215576171875, -0.236724853515625, -0.2012939453125, -0.165863037109375, -0.13043212890625, -0.095001220703125, -0.0595703125, -0.024139404296875, 0.01129150390625, 0.046722412109375, 0.0821533203125, 0.117584228515625, 0.15301513671875, 0.188446044921875, 0.223876953125, 0.259307861328125, 0.29473876953125, 0.330169677734375, 0.3656005859375, 0.401031494140625, 0.43646240234375, 0.471893310546875, 0.50732421875, 0.542755126953125, 0.57818603515625, 0.613616943359375, 0.6490478515625, 0.684478759765625, 0.71990966796875, 0.755340576171875, 0.790771484375, 0.826202392578125, 0.86163330078125, 0.897064208984375, 0.9324951171875, 0.967926025390625, 1.00335693359375, 1.038787841796875, 1.07421875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 4.0, 10.0, 6.0, 7.0, 18.0, 30.0, 44.0, 57.0, 114.0, 189.0, 336.0, 765.0, 2146.0, 9174.0, 142000.0, 872407.0, 16223.0, 3057.0, 1038.0, 433.0, 203.0, 111.0, 53.0, 34.0, 31.0, 21.0, 18.0, 10.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 3.0], "bins": [-5.59765625, -5.464813232421875, -5.33197021484375, -5.199127197265625, -5.0662841796875, -4.933441162109375, -4.80059814453125, -4.667755126953125, -4.534912109375, -4.402069091796875, -4.26922607421875, -4.136383056640625, -4.0035400390625, -3.870697021484375, -3.73785400390625, -3.605010986328125, -3.47216796875, -3.339324951171875, -3.20648193359375, -3.073638916015625, -2.9407958984375, -2.807952880859375, -2.67510986328125, -2.542266845703125, -2.409423828125, -2.276580810546875, -2.14373779296875, -2.010894775390625, -1.8780517578125, -1.745208740234375, -1.61236572265625, -1.479522705078125, -1.3466796875, -1.213836669921875, -1.08099365234375, -0.948150634765625, -0.8153076171875, -0.682464599609375, -0.54962158203125, -0.416778564453125, -0.283935546875, -0.151092529296875, -0.01824951171875, 0.114593505859375, 0.2474365234375, 0.380279541015625, 0.51312255859375, 0.645965576171875, 0.77880859375, 0.911651611328125, 1.04449462890625, 1.177337646484375, 1.3101806640625, 1.443023681640625, 1.57586669921875, 1.708709716796875, 1.841552734375, 1.974395751953125, 2.10723876953125, 2.240081787109375, 2.3729248046875, 2.505767822265625, 2.63861083984375, 2.771453857421875, 2.904296875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 4.0, 7.0, 3.0, 5.0, 11.0, 24.0, 24.0, 16.0, 24.0, 27.0, 25.0, 39.0, 60.0, 56.0, 98.0, 118.0, 88.0, 67.0, 51.0, 48.0, 37.0, 31.0, 33.0, 16.0, 18.0, 11.0, 9.0, 11.0, 8.0, 6.0, 4.0, 6.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.73828125, -5.56707763671875, -5.3958740234375, -5.22467041015625, -5.053466796875, -4.88226318359375, -4.7110595703125, -4.53985595703125, -4.36865234375, -4.19744873046875, -4.0262451171875, -3.85504150390625, -3.683837890625, -3.51263427734375, -3.3414306640625, -3.17022705078125, -2.9990234375, -2.82781982421875, -2.6566162109375, -2.48541259765625, -2.314208984375, -2.14300537109375, -1.9718017578125, -1.80059814453125, -1.62939453125, -1.45819091796875, -1.2869873046875, -1.11578369140625, -0.944580078125, -0.77337646484375, -0.6021728515625, -0.43096923828125, -0.259765625, -0.08856201171875, 0.0826416015625, 0.25384521484375, 0.425048828125, 0.59625244140625, 0.7674560546875, 0.93865966796875, 1.10986328125, 1.28106689453125, 1.4522705078125, 1.62347412109375, 1.794677734375, 1.96588134765625, 2.1370849609375, 2.30828857421875, 2.4794921875, 2.65069580078125, 2.8218994140625, 2.99310302734375, 3.164306640625, 3.33551025390625, 3.5067138671875, 3.67791748046875, 3.84912109375, 4.02032470703125, 4.1915283203125, 4.36273193359375, 4.533935546875, 4.70513916015625, 4.8763427734375, 5.04754638671875, 5.21875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 7.0, 10.0, 6.0, 10.0, 12.0, 16.0, 21.0, 38.0, 80.0, 96.0, 149.0, 211.0, 334.0, 620.0, 1133.0, 2423.0, 6551.0, 23424.0, 168384.0, 792187.0, 37347.0, 9012.0, 3178.0, 1446.0, 706.0, 400.0, 233.0, 167.0, 121.0, 75.0, 49.0, 27.0, 21.0, 16.0, 5.0, 6.0, 5.0, 5.0, 6.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 2.0], "bins": [-0.56591796875, -0.5498161315917969, -0.5337142944335938, -0.5176124572753906, -0.5015106201171875, -0.4854087829589844, -0.46930694580078125, -0.4532051086425781, -0.437103271484375, -0.4210014343261719, -0.40489959716796875, -0.3887977600097656, -0.3726959228515625, -0.3565940856933594, -0.34049224853515625, -0.3243904113769531, -0.30828857421875, -0.2921867370605469, -0.27608489990234375, -0.2599830627441406, -0.2438812255859375, -0.22777938842773438, -0.21167755126953125, -0.19557571411132812, -0.179473876953125, -0.16337203979492188, -0.14727020263671875, -0.13116836547851562, -0.1150665283203125, -0.09896469116210938, -0.08286285400390625, -0.06676101684570312, -0.0506591796875, -0.034557342529296875, -0.01845550537109375, -0.002353668212890625, 0.0137481689453125, 0.029850006103515625, 0.04595184326171875, 0.062053680419921875, 0.078155517578125, 0.09425735473632812, 0.11035919189453125, 0.12646102905273438, 0.1425628662109375, 0.15866470336914062, 0.17476654052734375, 0.19086837768554688, 0.20697021484375, 0.22307205200195312, 0.23917388916015625, 0.2552757263183594, 0.2713775634765625, 0.2874794006347656, 0.30358123779296875, 0.3196830749511719, 0.335784912109375, 0.3518867492675781, 0.36798858642578125, 0.3840904235839844, 0.4001922607421875, 0.4162940979003906, 0.43239593505859375, 0.4484977722167969, 0.464599609375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 5.0, 11.0, 25.0, 19.0, 27.0, 40.0, 66.0, 105.0, 188.0, 167.0, 132.0, 63.0, 45.0, 26.0, 25.0, 15.0, 17.0, 5.0, 7.0, 3.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00026535987854003906, -0.0002579987049102783, -0.0002506375312805176, -0.00024327635765075684, -0.0002359151840209961, -0.00022855401039123535, -0.0002211928367614746, -0.00021383166313171387, -0.00020647048950195312, -0.00019910931587219238, -0.00019174814224243164, -0.0001843869686126709, -0.00017702579498291016, -0.00016966462135314941, -0.00016230344772338867, -0.00015494227409362793, -0.0001475811004638672, -0.00014021992683410645, -0.0001328587532043457, -0.00012549757957458496, -0.00011813640594482422, -0.00011077523231506348, -0.00010341405868530273, -9.605288505554199e-05, -8.869171142578125e-05, -8.133053779602051e-05, -7.396936416625977e-05, -6.660819053649902e-05, -5.924701690673828e-05, -5.188584327697754e-05, -4.45246696472168e-05, -3.7163496017456055e-05, -2.9802322387695312e-05, -2.244114875793457e-05, -1.5079975128173828e-05, -7.718801498413086e-06, -3.5762786865234375e-07, 7.0035457611083984e-06, 1.436471939086914e-05, 2.1725893020629883e-05, 2.9087066650390625e-05, 3.644824028015137e-05, 4.380941390991211e-05, 5.117058753967285e-05, 5.8531761169433594e-05, 6.589293479919434e-05, 7.325410842895508e-05, 8.061528205871582e-05, 8.797645568847656e-05, 9.53376293182373e-05, 0.00010269880294799805, 0.00011005997657775879, 0.00011742115020751953, 0.00012478232383728027, 0.00013214349746704102, 0.00013950467109680176, 0.0001468658447265625, 0.00015422701835632324, 0.00016158819198608398, 0.00016894936561584473, 0.00017631053924560547, 0.0001836717128753662, 0.00019103288650512695, 0.0001983940601348877, 0.00020575523376464844]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 5.0, 11.0, 6.0, 14.0, 15.0, 30.0, 46.0, 72.0, 94.0, 161.0, 298.0, 485.0, 933.0, 2152.0, 5285.0, 17101.0, 84366.0, 836735.0, 75606.0, 15860.0, 5082.0, 2115.0, 927.0, 463.0, 280.0, 144.0, 86.0, 52.0, 32.0, 35.0, 11.0, 10.0, 9.0, 13.0, 9.0, 3.0, 2.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.477294921875, -0.4645576477050781, -0.45182037353515625, -0.4390830993652344, -0.4263458251953125, -0.4136085510253906, -0.40087127685546875, -0.3881340026855469, -0.375396728515625, -0.3626594543457031, -0.34992218017578125, -0.3371849060058594, -0.3244476318359375, -0.3117103576660156, -0.29897308349609375, -0.2862358093261719, -0.27349853515625, -0.2607612609863281, -0.24802398681640625, -0.23528671264648438, -0.2225494384765625, -0.20981216430664062, -0.19707489013671875, -0.18433761596679688, -0.171600341796875, -0.15886306762695312, -0.14612579345703125, -0.13338851928710938, -0.1206512451171875, -0.10791397094726562, -0.09517669677734375, -0.08243942260742188, -0.0697021484375, -0.056964874267578125, -0.04422760009765625, -0.031490325927734375, -0.0187530517578125, -0.006015777587890625, 0.00672149658203125, 0.019458770751953125, 0.032196044921875, 0.044933319091796875, 0.05767059326171875, 0.07040786743164062, 0.0831451416015625, 0.09588241577148438, 0.10861968994140625, 0.12135696411132812, 0.13409423828125, 0.14683151245117188, 0.15956878662109375, 0.17230606079101562, 0.1850433349609375, 0.19778060913085938, 0.21051788330078125, 0.22325515747070312, 0.235992431640625, 0.24872970581054688, 0.26146697998046875, 0.2742042541503906, 0.2869415283203125, 0.2996788024902344, 0.31241607666015625, 0.3251533508300781, 0.337890625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 0.0, 5.0, 5.0, 11.0, 10.0, 5.0, 10.0, 14.0, 23.0, 27.0, 35.0, 74.0, 142.0, 196.0, 197.0, 77.0, 42.0, 38.0, 20.0, 19.0, 10.0, 9.0, 4.0, 4.0, 3.0, 4.0, 2.0, 0.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0498046875, -1.0218505859375, -0.993896484375, -0.9659423828125, -0.93798828125, -0.9100341796875, -0.882080078125, -0.8541259765625, -0.826171875, -0.7982177734375, -0.770263671875, -0.7423095703125, -0.71435546875, -0.6864013671875, -0.658447265625, -0.6304931640625, -0.6025390625, -0.5745849609375, -0.546630859375, -0.5186767578125, -0.49072265625, -0.4627685546875, -0.434814453125, -0.4068603515625, -0.37890625, -0.3509521484375, -0.322998046875, -0.2950439453125, -0.26708984375, -0.2391357421875, -0.211181640625, -0.1832275390625, -0.1552734375, -0.1273193359375, -0.099365234375, -0.0714111328125, -0.04345703125, -0.0155029296875, 0.012451171875, 0.0404052734375, 0.068359375, 0.0963134765625, 0.124267578125, 0.1522216796875, 0.18017578125, 0.2081298828125, 0.236083984375, 0.2640380859375, 0.2919921875, 0.3199462890625, 0.347900390625, 0.3758544921875, 0.40380859375, 0.4317626953125, 0.459716796875, 0.4876708984375, 0.515625, 0.5435791015625, 0.571533203125, 0.5994873046875, 0.62744140625, 0.6553955078125, 0.683349609375, 0.7113037109375, 0.7392578125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 11.0, 25.0, 44.0, 149.0, 574.0, 112.0, 44.0, 28.0, 10.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.82303810119629, -29.77545166015625, -28.727863311767578, -27.68027687072754, -26.6326904296875, -25.58510398864746, -24.537517547607422, -23.48992919921875, -22.44234275817871, -21.394756317138672, -20.34716796875, -19.29958152770996, -18.251995086669922, -17.204408645629883, -16.156822204589844, -15.109233856201172, -14.061647415161133, -13.014060974121094, -11.966473579406738, -10.918886184692383, -9.871299743652344, -8.823713302612305, -7.776125907897949, -6.728538990020752, -5.680952072143555, -4.633365154266357, -3.58577823638916, -2.538191318511963, -1.4906044006347656, -0.44301748275756836, 0.6045694351196289, 1.6521563529968262, 2.6997451782226562, 3.7473320960998535, 4.794919013977051, 5.842505931854248, 6.890092849731445, 7.937679767608643, 8.98526668548584, 10.032854080200195, 11.080440521240234, 12.128026962280273, 13.175614356994629, 14.223201751708984, 15.270788192749023, 16.318374633789062, 17.365962982177734, 18.413549423217773, 19.461135864257812, 20.50872230529785, 21.55630874633789, 22.603897094726562, 23.6514835357666, 24.69906997680664, 25.746658325195312, 26.79424476623535, 27.84183120727539, 28.88941764831543, 29.93700408935547, 30.98459243774414, 32.03218078613281, 33.07976531982422, 34.12735366821289, 35.1749382019043, 36.22252655029297]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 5.0, 0.0, 4.0, 8.0, 7.0, 9.0, 10.0, 7.0, 22.0, 12.0, 18.0, 19.0, 22.0, 21.0, 30.0, 45.0, 110.0, 165.0, 143.0, 109.0, 39.0, 26.0, 25.0, 17.0, 18.0, 18.0, 10.0, 11.0, 11.0, 17.0, 13.0, 4.0, 4.0, 2.0, 4.0, 5.0, 2.0, 2.0, 0.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.334632873535156, -11.94738483428955, -11.560136795043945, -11.17288875579834, -10.785640716552734, -10.398392677307129, -10.011144638061523, -9.623896598815918, -9.236648559570312, -8.849400520324707, -8.462152481079102, -8.074904441833496, -7.687656402587891, -7.300408363342285, -6.91316032409668, -6.525912284851074, -6.1386637687683105, -5.751415729522705, -5.3641676902771, -4.976919651031494, -4.589671611785889, -4.202423572540283, -3.8151752948760986, -3.427927255630493, -3.0406792163848877, -2.6534311771392822, -2.2661831378936768, -1.8789349794387817, -1.4916869401931763, -1.1044389009475708, -0.7171907424926758, -0.3299427032470703, 0.057305335998535156, 0.444553405046463, 0.8318014740943909, 1.2190495729446411, 1.6062976121902466, 1.993545651435852, 2.380793809890747, 2.7680418491363525, 3.155289888381958, 3.5425379276275635, 3.929785966873169, 4.3170342445373535, 4.704282283782959, 5.0915303230285645, 5.47877836227417, 5.866026401519775, 6.253274440765381, 6.640522480010986, 7.027770519256592, 7.415018558502197, 7.802266597747803, 8.189515113830566, 8.576763153076172, 8.964011192321777, 9.351259231567383, 9.738507270812988, 10.125755310058594, 10.5130033493042, 10.900251388549805, 11.28749942779541, 11.674747467041016, 12.061995506286621, 12.449243545532227]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 6.0, 7.0, 9.0, 11.0, 9.0, 10.0, 12.0, 12.0, 18.0, 29.0, 17.0, 33.0, 34.0, 34.0, 55.0, 123.0, 250.0, 66.0, 33.0, 28.0, 25.0, 28.0, 19.0, 17.0, 14.0, 16.0, 15.0, 10.0, 10.0, 9.0, 6.0, 7.0, 3.0, 4.0, 6.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.078125, -1.0498580932617188, -1.0215911865234375, -0.9933242797851562, -0.965057373046875, -0.9367904663085938, -0.9085235595703125, -0.8802566528320312, -0.85198974609375, -0.8237228393554688, -0.7954559326171875, -0.7671890258789062, -0.738922119140625, -0.7106552124023438, -0.6823883056640625, -0.6541213989257812, -0.6258544921875, -0.5975875854492188, -0.5693206787109375, -0.5410537719726562, -0.512786865234375, -0.48451995849609375, -0.4562530517578125, -0.42798614501953125, -0.39971923828125, -0.37145233154296875, -0.3431854248046875, -0.31491851806640625, -0.286651611328125, -0.25838470458984375, -0.2301177978515625, -0.20185089111328125, -0.173583984375, -0.14531707763671875, -0.1170501708984375, -0.08878326416015625, -0.060516357421875, -0.03224945068359375, -0.0039825439453125, 0.02428436279296875, 0.05255126953125, 0.08081817626953125, 0.1090850830078125, 0.13735198974609375, 0.165618896484375, 0.19388580322265625, 0.2221527099609375, 0.25041961669921875, 0.2786865234375, 0.30695343017578125, 0.3352203369140625, 0.36348724365234375, 0.391754150390625, 0.42002105712890625, 0.4482879638671875, 0.47655487060546875, 0.50482177734375, 0.5330886840820312, 0.5613555908203125, 0.5896224975585938, 0.617889404296875, 0.6461563110351562, 0.6744232177734375, 0.7026901245117188, 0.73095703125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 4.0, 7.0, 18.0, 15.0, 27.0, 48.0, 99.0, 284.0, 1242.0, 9081.0, 8364688.0, 11113.0, 1319.0, 344.0, 145.0, 48.0, 31.0, 19.0, 5.0, 5.0, 11.0, 16.0, 11.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0], "bins": [-14.428406715393066, -13.922683715820312, -13.416961669921875, -12.911238670349121, -12.405515670776367, -11.89979362487793, -11.394070625305176, -10.888347625732422, -10.382625579833984, -9.87690258026123, -9.371180534362793, -8.865457534790039, -8.359735488891602, -7.854012489318848, -7.348289489746094, -6.842566967010498, -6.336844444274902, -5.831121921539307, -5.325399398803711, -4.819676399230957, -4.313953876495361, -3.8082313537597656, -3.302508592605591, -2.796785831451416, -2.2910633087158203, -1.785340666770935, -1.2796180248260498, -0.7738953828811646, -0.2681727409362793, 0.2375497817993164, 0.7432725429534912, 1.248995304107666, 1.7547187805175781, 2.260441303253174, 2.7661640644073486, 3.2718868255615234, 3.777609348297119, 4.283331871032715, 4.789054870605469, 5.2947773933410645, 5.80049991607666, 6.306222438812256, 6.811944961547852, 7.3176679611206055, 7.823390483856201, 8.329113006591797, 8.83483600616455, 9.340559005737305, 9.846281051635742, 10.352004051208496, 10.857726097106934, 11.363449096679688, 11.869171142578125, 12.374894142150879, 12.880617141723633, 13.38633918762207, 13.892062187194824, 14.397785186767578, 14.903507232666016, 15.40923023223877, 15.914953231811523, 16.42067527770996, 16.9263973236084, 17.43212127685547, 17.937843322753906]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 5.0, 3.0, 4.0, 2.0, 12.0, 8.0, 11.0, 4.0, 6.0, 7.0, 4.0, 10.0, 3.0, 3.0, 1.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.34786033630371, -17.9002742767334, -17.45269012451172, -17.005104064941406, -16.557518005371094, -16.10993194580078, -15.662347793579102, -15.214761734008789, -14.767176628112793, -14.319591522216797, -13.872005462646484, -13.424420356750488, -12.976835250854492, -12.52924919128418, -12.081664085388184, -11.634078979492188, -11.186492919921875, -10.738907814025879, -10.291321754455566, -9.84373664855957, -9.396150588989258, -8.948565483093262, -8.500980377197266, -8.053394317626953, -7.605809211730957, -7.158223628997803, -6.710638046264648, -6.263052940368652, -5.815467357635498, -5.367881774902344, -4.920296669006348, -4.472711086273193, -4.025124549865723, -3.5775389671325684, -3.129953622817993, -2.682368278503418, -2.2347826957702637, -1.7871971130371094, -1.3396117687225342, -0.892026424407959, -0.4444408416748047, 0.0031446218490600586, 0.4507300853729248, 0.8983155488967896, 1.3459010124206543, 1.7934865951538086, 2.241071939468384, 2.688657283782959, 3.1362428665161133, 3.5838284492492676, 4.031414031982422, 4.478999137878418, 4.926584720611572, 5.374170303344727, 5.821755409240723, 6.269340991973877, 6.716926574707031, 7.1645121574401855, 7.61209774017334, 8.059682846069336, 8.507268905639648, 8.954854011535645, 9.40243911743164, 9.850025177001953, 10.29761028289795]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 1.0, 4.0, 10.0, 4.0, 11.0, 11.0, 16.0, 19.0, 27.0, 37.0, 52.0, 80.0, 132.0, 231.0, 402.0, 860.0, 1823.0, 3979.0, 10163.0, 28252.0, 90381.0, 212254.0, 117146.0, 36323.0, 12858.0, 4962.0, 2153.0, 957.0, 468.0, 268.0, 136.0, 69.0, 73.0, 24.0, 26.0, 19.0, 14.0, 6.0, 6.0, 2.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.984375, -7.76019287109375, -7.5360107421875, -7.31182861328125, -7.087646484375, -6.86346435546875, -6.6392822265625, -6.41510009765625, -6.19091796875, -5.96673583984375, -5.7425537109375, -5.51837158203125, -5.294189453125, -5.07000732421875, -4.8458251953125, -4.62164306640625, -4.3974609375, -4.17327880859375, -3.9490966796875, -3.72491455078125, -3.500732421875, -3.27655029296875, -3.0523681640625, -2.82818603515625, -2.60400390625, -2.37982177734375, -2.1556396484375, -1.93145751953125, -1.707275390625, -1.48309326171875, -1.2589111328125, -1.03472900390625, -0.810546875, -0.58636474609375, -0.3621826171875, -0.13800048828125, 0.086181640625, 0.31036376953125, 0.5345458984375, 0.75872802734375, 0.98291015625, 1.20709228515625, 1.4312744140625, 1.65545654296875, 1.879638671875, 2.10382080078125, 2.3280029296875, 2.55218505859375, 2.7763671875, 3.00054931640625, 3.2247314453125, 3.44891357421875, 3.673095703125, 3.89727783203125, 4.1214599609375, 4.34564208984375, 4.56982421875, 4.79400634765625, 5.0181884765625, 5.24237060546875, 5.466552734375, 5.69073486328125, 5.9149169921875, 6.13909912109375, 6.36328125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 9.0, 5.0, 8.0, 10.0, 9.0, 19.0, 23.0, 23.0, 33.0, 46.0, 49.0, 56.0, 59.0, 55.0, 71.0, 93.0, 84.0, 71.0, 60.0, 53.0, 33.0, 27.0, 21.0, 22.0, 17.0, 14.0, 6.0, 8.0, 7.0, 4.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4912109375, -1.4498443603515625, -1.408477783203125, -1.3671112060546875, -1.32574462890625, -1.2843780517578125, -1.243011474609375, -1.2016448974609375, -1.1602783203125, -1.1189117431640625, -1.077545166015625, -1.0361785888671875, -0.99481201171875, -0.9534454345703125, -0.912078857421875, -0.8707122802734375, -0.829345703125, -0.7879791259765625, -0.746612548828125, -0.7052459716796875, -0.66387939453125, -0.6225128173828125, -0.581146240234375, -0.5397796630859375, -0.4984130859375, -0.4570465087890625, -0.415679931640625, -0.3743133544921875, -0.33294677734375, -0.2915802001953125, -0.250213623046875, -0.2088470458984375, -0.16748046875, -0.1261138916015625, -0.084747314453125, -0.0433807373046875, -0.00201416015625, 0.0393524169921875, 0.080718994140625, 0.1220855712890625, 0.1634521484375, 0.2048187255859375, 0.246185302734375, 0.2875518798828125, 0.32891845703125, 0.3702850341796875, 0.411651611328125, 0.4530181884765625, 0.494384765625, 0.5357513427734375, 0.577117919921875, 0.6184844970703125, 0.65985107421875, 0.7012176513671875, 0.742584228515625, 0.7839508056640625, 0.8253173828125, 0.8666839599609375, 0.908050537109375, 0.9494171142578125, 0.99078369140625, 1.0321502685546875, 1.073516845703125, 1.1148834228515625, 1.15625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 13.0, 4.0, 11.0, 21.0, 35.0, 62.0, 144.0, 121.0, 43.0, 15.0, 5.0, 6.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.673454284667969, -9.242777824401855, -8.812101364135742, -8.381423950195312, -7.950747489929199, -7.520071029663086, -7.089394569396973, -6.658718109130859, -6.228041172027588, -5.797364711761475, -5.366687774658203, -4.93601131439209, -4.505334854125977, -4.074657917022705, -3.643981456756592, -3.2133047580718994, -2.782628059387207, -2.3519513607025146, -1.9212747812271118, -1.490598201751709, -1.0599215030670166, -0.6292448043823242, -0.19856834411621094, 0.23210835456848145, 0.6627850532531738, 1.0934617519378662, 1.524138331413269, 1.9548149108886719, 2.3854916095733643, 2.8161683082580566, 3.24684476852417, 3.6775214672088623, 4.108198165893555, 4.538874626159668, 4.9695515632629395, 5.400228023529053, 5.830904960632324, 6.2615814208984375, 6.692257881164551, 7.122934341430664, 7.5536112785339355, 7.984287738800049, 8.41496467590332, 8.845641136169434, 9.276317596435547, 9.706995010375977, 10.137670516967773, 10.568347930908203, 10.999024391174316, 11.42970085144043, 11.860377311706543, 12.291053771972656, 12.721731185913086, 13.1524076461792, 13.583084106445312, 14.013760566711426, 14.444437026977539, 14.875113487243652, 15.305789947509766, 15.736467361450195, 16.167142868041992, 16.597820281982422, 17.02849578857422, 17.45917320251465, 17.889850616455078]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 1.0, 5.0, 9.0, 9.0, 9.0, 11.0, 20.0, 48.0, 66.0, 90.0, 73.0, 46.0, 31.0, 18.0, 5.0, 4.0, 5.0, 6.0, 1.0, 4.0, 2.0, 2.0, 5.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.619020462036133, -6.4260993003845215, -6.23317813873291, -6.040256977081299, -5.8473358154296875, -5.654414176940918, -5.461493015289307, -5.268571853637695, -5.075650691986084, -4.882729530334473, -4.689808368682861, -4.49688720703125, -4.3039655685424805, -4.111044406890869, -3.918123245239258, -3.7252020835876465, -3.532280921936035, -3.339359760284424, -3.1464385986328125, -2.953517198562622, -2.7605960369110107, -2.5676748752593994, -2.374753475189209, -2.1818323135375977, -1.9889111518859863, -1.795989990234375, -1.6030687093734741, -1.4101474285125732, -1.217226266860962, -1.0243051052093506, -0.8313838243484497, -0.6384625434875488, -0.4455413818359375, -0.2526201605796814, -0.05969893932342529, 0.1332222819328308, 0.3261435031890869, 0.519064724445343, 0.7119859457015991, 0.9049072265625, 1.0978283882141113, 1.2907495498657227, 1.4836708307266235, 1.6765921115875244, 1.8695132732391357, 2.062434434890747, 2.2553558349609375, 2.448276996612549, 2.64119815826416, 2.8341193199157715, 3.027040481567383, 3.2199618816375732, 3.4128830432891846, 3.605804204940796, 3.7987256050109863, 3.9916467666625977, 4.184567928314209, 4.37748908996582, 4.570410251617432, 4.763331413269043, 4.9562530517578125, 5.149174213409424, 5.342095375061035, 5.5350165367126465, 5.727937698364258]}, "eval/loss": 4.745861530303955, "eval/wer": 1.976279254264181, "eval/runtime": 966.758, "eval/samples_per_second": 2.733, "eval/steps_per_second": 0.342, "train/train_runtime": 8574.3703, "train/train_samples_per_second": 3.328, "train/train_steps_per_second": 0.208, "train/total_flos": 0.0, "train/train_loss": 4.819954753590272} \ No newline at end of file +{"train/loss": 3.9784, "train/learning_rate": 9.345794392523364e-07, "train/epoch": 1.0, "train/global_step": 1784, "_runtime": 10001, "_timestamp": 1646221176, "_step": 1788, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 13.0, 17.0, 52.0, 415.0, 420.0, 70.0, 16.0, 4.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-925.3422241210938, -902.2313232421875, -879.120361328125, -856.0094604492188, -832.8985595703125, -809.78759765625, -786.6766967773438, -763.5657958984375, -740.454833984375, -717.3439331054688, -694.2329711914062, -671.1220703125, -648.0111083984375, -624.9002075195312, -601.789306640625, -578.6783447265625, -555.5674438476562, -532.45654296875, -509.3455810546875, -486.23468017578125, -463.1237487792969, -440.0128173828125, -416.90191650390625, -393.7909851074219, -370.6800537109375, -347.5691223144531, -324.45819091796875, -301.3472900390625, -278.2363586425781, -255.12542724609375, -232.01451110839844, -208.90359497070312, -185.79266357421875, -162.68173217773438, -139.57081604003906, -116.45989227294922, -93.34896850585938, -70.23804473876953, -47.12712097167969, -24.016204833984375, -0.9052734375, 22.205650329589844, 45.31657409667969, 68.42749786376953, 91.53842163085938, 114.64934539794922, 137.76026916503906, 160.87118530273438, 183.98211669921875, 207.09304809570312, 230.20396423339844, 253.31488037109375, 276.4258117675781, 299.5367431640625, 322.64764404296875, 345.7585754394531, 368.8695068359375, 391.9804382324219, 415.09136962890625, 438.2022705078125, 461.3132019042969, 484.42413330078125, 507.5350341796875, 530.64599609375, 553.7568969726562]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 6.0, 7.0, 8.0, 13.0, 11.0, 7.0, 8.0, 15.0, 18.0, 21.0, 20.0, 18.0, 25.0, 30.0, 34.0, 27.0, 70.0, 176.0, 140.0, 82.0, 30.0, 23.0, 28.0, 28.0, 23.0, 23.0, 17.0, 17.0, 14.0, 13.0, 5.0, 7.0, 10.0, 6.0, 8.0, 4.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-667.4768676757812, -646.577392578125, -625.6779174804688, -604.7784423828125, -583.8789672851562, -562.9794921875, -542.0800170898438, -521.1805419921875, -500.2810974121094, -479.3816223144531, -458.4821472167969, -437.5826721191406, -416.6832275390625, -395.78375244140625, -374.88427734375, -353.98480224609375, -333.0853271484375, -312.18585205078125, -291.286376953125, -270.38690185546875, -249.48744201660156, -228.5879669189453, -207.68850708007812, -186.78903198242188, -165.88955688476562, -144.99008178710938, -124.09061431884766, -103.19114685058594, -82.29167175292969, -61.39219665527344, -40.49272918701172, -19.59326171875, 1.30621337890625, 22.205684661865234, 43.10515594482422, 64.00462341308594, 84.90409851074219, 105.80357360839844, 126.70304107666016, 147.60250854492188, 168.50198364257812, 189.40145874023438, 210.30093383789062, 231.2003936767578, 252.09986877441406, 272.99932861328125, 293.8988037109375, 314.79827880859375, 335.69775390625, 356.59722900390625, 377.4967041015625, 398.39617919921875, 419.295654296875, 440.19512939453125, 461.0945739746094, 481.9940490722656, 502.8935241699219, 523.79296875, 544.6924438476562, 565.5919189453125, 586.4913940429688, 607.390869140625, 628.2903442382812, 649.1898193359375, 670.0892944335938]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 8.0, 10.0, 11.0, 9.0, 5.0, 10.0, 14.0, 11.0, 24.0, 20.0, 21.0, 19.0, 28.0, 39.0, 25.0, 67.0, 113.0, 133.0, 109.0, 60.0, 33.0, 24.0, 25.0, 24.0, 23.0, 21.0, 16.0, 22.0, 8.0, 11.0, 9.0, 5.0, 6.0, 9.0, 1.0, 10.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.859375, -10.5013427734375, -10.143310546875, -9.7852783203125, -9.42724609375, -9.0692138671875, -8.711181640625, -8.3531494140625, -7.9951171875, -7.6370849609375, -7.279052734375, -6.9210205078125, -6.56298828125, -6.2049560546875, -5.846923828125, -5.4888916015625, -5.130859375, -4.7728271484375, -4.414794921875, -4.0567626953125, -3.69873046875, -3.3406982421875, -2.982666015625, -2.6246337890625, -2.2666015625, -1.9085693359375, -1.550537109375, -1.1925048828125, -0.83447265625, -0.4764404296875, -0.118408203125, 0.2396240234375, 0.59765625, 0.9556884765625, 1.313720703125, 1.6717529296875, 2.02978515625, 2.3878173828125, 2.745849609375, 3.1038818359375, 3.4619140625, 3.8199462890625, 4.177978515625, 4.5360107421875, 4.89404296875, 5.2520751953125, 5.610107421875, 5.9681396484375, 6.326171875, 6.6842041015625, 7.042236328125, 7.4002685546875, 7.75830078125, 8.1163330078125, 8.474365234375, 8.8323974609375, 9.1904296875, 9.5484619140625, 9.906494140625, 10.2645263671875, 10.62255859375, 10.9805908203125, 11.338623046875, 11.6966552734375, 12.0546875]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 6.0, 5.0, 10.0, 9.0, 14.0, 21.0, 33.0, 36.0, 59.0, 58.0, 72.0, 88.0, 145.0, 197.0, 306.0, 383.0, 600.0, 1027.0, 1953.0, 3929.0, 10399.0, 43091.0, 4044670.0, 65124.0, 12372.0, 4412.0, 2005.0, 1166.0, 640.0, 383.0, 269.0, 216.0, 166.0, 105.0, 78.0, 52.0, 40.0, 26.0, 31.0, 22.0, 17.0, 20.0, 7.0, 8.0, 3.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-107.3125, -103.802734375, -100.29296875, -96.783203125, -93.2734375, -89.763671875, -86.25390625, -82.744140625, -79.234375, -75.724609375, -72.21484375, -68.705078125, -65.1953125, -61.685546875, -58.17578125, -54.666015625, -51.15625, -47.646484375, -44.13671875, -40.626953125, -37.1171875, -33.607421875, -30.09765625, -26.587890625, -23.078125, -19.568359375, -16.05859375, -12.548828125, -9.0390625, -5.529296875, -2.01953125, 1.490234375, 5.0, 8.509765625, 12.01953125, 15.529296875, 19.0390625, 22.548828125, 26.05859375, 29.568359375, 33.078125, 36.587890625, 40.09765625, 43.607421875, 47.1171875, 50.626953125, 54.13671875, 57.646484375, 61.15625, 64.666015625, 68.17578125, 71.685546875, 75.1953125, 78.705078125, 82.21484375, 85.724609375, 89.234375, 92.744140625, 96.25390625, 99.763671875, 103.2734375, 106.783203125, 110.29296875, 113.802734375, 117.3125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 6.0, 4.0, 12.0, 10.0, 13.0, 22.0, 19.0, 20.0, 29.0, 35.0, 32.0, 57.0, 56.0, 87.0, 189.0, 439.0, 1039.0, 927.0, 489.0, 192.0, 102.0, 66.0, 42.0, 30.0, 28.0, 23.0, 11.0, 26.0, 13.0, 7.0, 13.0, 6.0, 2.0, 7.0, 2.0, 3.0, 1.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-38.0, -36.77294921875, -35.5458984375, -34.31884765625, -33.091796875, -31.86474609375, -30.6376953125, -29.41064453125, -28.18359375, -26.95654296875, -25.7294921875, -24.50244140625, -23.275390625, -22.04833984375, -20.8212890625, -19.59423828125, -18.3671875, -17.14013671875, -15.9130859375, -14.68603515625, -13.458984375, -12.23193359375, -11.0048828125, -9.77783203125, -8.55078125, -7.32373046875, -6.0966796875, -4.86962890625, -3.642578125, -2.41552734375, -1.1884765625, 0.03857421875, 1.265625, 2.49267578125, 3.7197265625, 4.94677734375, 6.173828125, 7.40087890625, 8.6279296875, 9.85498046875, 11.08203125, 12.30908203125, 13.5361328125, 14.76318359375, 15.990234375, 17.21728515625, 18.4443359375, 19.67138671875, 20.8984375, 22.12548828125, 23.3525390625, 24.57958984375, 25.806640625, 27.03369140625, 28.2607421875, 29.48779296875, 30.71484375, 31.94189453125, 33.1689453125, 34.39599609375, 35.623046875, 36.85009765625, 38.0771484375, 39.30419921875, 40.53125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 8.0, 6.0, 10.0, 8.0, 18.0, 14.0, 23.0, 28.0, 37.0, 53.0, 71.0, 76.0, 82.0, 129.0, 175.0, 280.0, 496.0, 1232.0, 5414.0, 40811.0, 3830796.0, 292463.0, 17032.0, 2993.0, 821.0, 371.0, 210.0, 128.0, 105.0, 82.0, 67.0, 48.0, 45.0, 31.0, 22.0, 24.0, 10.0, 14.0, 10.0, 13.0, 8.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-108.3125, -105.0107421875, -101.708984375, -98.4072265625, -95.10546875, -91.8037109375, -88.501953125, -85.2001953125, -81.8984375, -78.5966796875, -75.294921875, -71.9931640625, -68.69140625, -65.3896484375, -62.087890625, -58.7861328125, -55.484375, -52.1826171875, -48.880859375, -45.5791015625, -42.27734375, -38.9755859375, -35.673828125, -32.3720703125, -29.0703125, -25.7685546875, -22.466796875, -19.1650390625, -15.86328125, -12.5615234375, -9.259765625, -5.9580078125, -2.65625, 0.6455078125, 3.947265625, 7.2490234375, 10.55078125, 13.8525390625, 17.154296875, 20.4560546875, 23.7578125, 27.0595703125, 30.361328125, 33.6630859375, 36.96484375, 40.2666015625, 43.568359375, 46.8701171875, 50.171875, 53.4736328125, 56.775390625, 60.0771484375, 63.37890625, 66.6806640625, 69.982421875, 73.2841796875, 76.5859375, 79.8876953125, 83.189453125, 86.4912109375, 89.79296875, 93.0947265625, 96.396484375, 99.6982421875, 103.0]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 8.0, 4.0, 32.0, 28.0, 87.0, 247.0, 436.0, 126.0, 27.0, 10.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-182.33505249023438, -174.4733428955078, -166.61163330078125, -158.74990844726562, -150.88819885253906, -143.0264892578125, -135.16477966308594, -127.30306243896484, -119.44134521484375, -111.57963562011719, -103.7179183959961, -95.85620880126953, -87.99449157714844, -80.13278198242188, -72.27107238769531, -64.40935516357422, -56.547645568847656, -48.68593215942383, -40.82421875, -32.96250915527344, -25.100793838500977, -17.23908233642578, -9.377368927001953, -1.515655517578125, 6.346057891845703, 14.207771301269531, 22.06948471069336, 29.931196212768555, 37.79290771484375, 45.65462112426758, 53.516334533691406, 61.378047943115234, 69.23976135253906, 77.10147094726562, 84.96318817138672, 92.82489776611328, 100.68661499023438, 108.54832458496094, 116.4100341796875, 124.2717514038086, 132.1334686279297, 139.99517822265625, 147.8568878173828, 155.71861267089844, 163.580322265625, 171.44203186035156, 179.30374145507812, 187.16546630859375, 195.02716064453125, 202.8888702392578, 210.75057983398438, 218.6123046875, 226.47401428222656, 234.33572387695312, 242.1974334716797, 250.05914306640625, 257.9208679199219, 265.7825927734375, 273.644287109375, 281.5060119628906, 289.3677062988281, 297.22943115234375, 305.0911560058594, 312.9528503417969, 320.8145751953125]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 6.0, 6.0, 8.0, 5.0, 10.0, 13.0, 9.0, 15.0, 17.0, 19.0, 35.0, 24.0, 34.0, 32.0, 41.0, 29.0, 41.0, 39.0, 47.0, 45.0, 45.0, 40.0, 41.0, 40.0, 35.0, 36.0, 45.0, 33.0, 26.0, 21.0, 38.0, 20.0, 20.0, 17.0, 8.0, 11.0, 10.0, 8.0, 3.0, 11.0, 6.0, 0.0, 3.0, 6.0, 3.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-144.60552978515625, -139.92665100097656, -135.24777221679688, -130.5688934326172, -125.89002227783203, -121.21114349365234, -116.53227233886719, -111.8533935546875, -107.17451477050781, -102.49563598632812, -97.81675720214844, -93.13788604736328, -88.4590072631836, -83.7801284790039, -79.10125732421875, -74.42237854003906, -69.74349975585938, -65.06462097167969, -60.385746002197266, -55.706871032714844, -51.027992248535156, -46.34911346435547, -41.67023849487305, -36.991363525390625, -32.31248474121094, -27.633607864379883, -22.954730987548828, -18.275854110717773, -13.596977233886719, -8.918100357055664, -4.239223480224609, 0.4396514892578125, 5.1185302734375, 9.797407150268555, 14.47628402709961, 19.155160903930664, 23.83403778076172, 28.512914657592773, 33.19179153442383, 37.87066650390625, 42.54954528808594, 47.228424072265625, 51.90729904174805, 56.58617401123047, 61.265052795410156, 65.94393157958984, 70.622802734375, 75.30168151855469, 79.98056030273438, 84.65943908691406, 89.33831787109375, 94.0171890258789, 98.6960678100586, 103.37494659423828, 108.05381774902344, 112.73269653320312, 117.41157531738281, 122.0904541015625, 126.76933288574219, 131.44821166992188, 136.1270751953125, 140.8059539794922, 145.48483276367188, 150.16371154785156, 154.84259033203125]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 6.0, 5.0, 7.0, 12.0, 9.0, 7.0, 10.0, 8.0, 9.0, 17.0, 18.0, 25.0, 16.0, 28.0, 30.0, 42.0, 58.0, 62.0, 94.0, 92.0, 99.0, 62.0, 49.0, 31.0, 28.0, 22.0, 20.0, 27.0, 12.0, 20.0, 10.0, 12.0, 8.0, 6.0, 7.0, 8.0, 7.0, 3.0, 3.0, 8.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.984375, -8.666259765625, -8.34814453125, -8.030029296875, -7.7119140625, -7.393798828125, -7.07568359375, -6.757568359375, -6.439453125, -6.121337890625, -5.80322265625, -5.485107421875, -5.1669921875, -4.848876953125, -4.53076171875, -4.212646484375, -3.89453125, -3.576416015625, -3.25830078125, -2.940185546875, -2.6220703125, -2.303955078125, -1.98583984375, -1.667724609375, -1.349609375, -1.031494140625, -0.71337890625, -0.395263671875, -0.0771484375, 0.240966796875, 0.55908203125, 0.877197265625, 1.1953125, 1.513427734375, 1.83154296875, 2.149658203125, 2.4677734375, 2.785888671875, 3.10400390625, 3.422119140625, 3.740234375, 4.058349609375, 4.37646484375, 4.694580078125, 5.0126953125, 5.330810546875, 5.64892578125, 5.967041015625, 6.28515625, 6.603271484375, 6.92138671875, 7.239501953125, 7.5576171875, 7.875732421875, 8.19384765625, 8.511962890625, 8.830078125, 9.148193359375, 9.46630859375, 9.784423828125, 10.1025390625, 10.420654296875, 10.73876953125, 11.056884765625, 11.375]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 7.0, 2.0, 4.0, 5.0, 12.0, 7.0, 14.0, 27.0, 34.0, 32.0, 72.0, 101.0, 167.0, 251.0, 349.0, 549.0, 899.0, 1281.0, 2107.0, 3302.0, 5285.0, 8595.0, 14270.0, 24499.0, 45156.0, 91610.0, 220269.0, 345453.0, 139140.0, 63874.0, 33210.0, 18630.0, 11075.0, 6694.0, 4237.0, 2608.0, 1642.0, 1056.0, 724.0, 435.0, 307.0, 176.0, 145.0, 83.0, 59.0, 34.0, 23.0, 15.0, 18.0, 7.0, 8.0, 2.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2169189453125, -0.2097492218017578, -0.20257949829101562, -0.19540977478027344, -0.18824005126953125, -0.18107032775878906, -0.17390060424804688, -0.1667308807373047, -0.1595611572265625, -0.1523914337158203, -0.14522171020507812, -0.13805198669433594, -0.13088226318359375, -0.12371253967285156, -0.11654281616210938, -0.10937309265136719, -0.102203369140625, -0.09503364562988281, -0.08786392211914062, -0.08069419860839844, -0.07352447509765625, -0.06635475158691406, -0.059185028076171875, -0.05201530456542969, -0.0448455810546875, -0.03767585754394531, -0.030506134033203125, -0.023336410522460938, -0.01616668701171875, -0.008996963500976562, -0.001827239990234375, 0.0053424835205078125, 0.01251220703125, 0.019681930541992188, 0.026851654052734375, 0.03402137756347656, 0.04119110107421875, 0.04836082458496094, 0.055530548095703125, 0.06270027160644531, 0.0698699951171875, 0.07703971862792969, 0.08420944213867188, 0.09137916564941406, 0.09854888916015625, 0.10571861267089844, 0.11288833618164062, 0.12005805969238281, 0.127227783203125, 0.1343975067138672, 0.14156723022460938, 0.14873695373535156, 0.15590667724609375, 0.16307640075683594, 0.17024612426757812, 0.1774158477783203, 0.1845855712890625, 0.1917552947998047, 0.19892501831054688, 0.20609474182128906, 0.21326446533203125, 0.22043418884277344, 0.22760391235351562, 0.2347736358642578, 0.241943359375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 4.0, 6.0, 8.0, 5.0, 11.0, 9.0, 11.0, 10.0, 17.0, 15.0, 17.0, 39.0, 33.0, 32.0, 27.0, 39.0, 32.0, 42.0, 39.0, 41.0, 1076.0, 44.0, 38.0, 35.0, 56.0, 32.0, 27.0, 36.0, 36.0, 36.0, 30.0, 24.0, 20.0, 18.0, 15.0, 5.0, 13.0, 10.0, 9.0, 12.0, 4.0, 8.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.83203125, -3.71209716796875, -3.5921630859375, -3.47222900390625, -3.352294921875, -3.23236083984375, -3.1124267578125, -2.99249267578125, -2.87255859375, -2.75262451171875, -2.6326904296875, -2.51275634765625, -2.392822265625, -2.27288818359375, -2.1529541015625, -2.03302001953125, -1.9130859375, -1.79315185546875, -1.6732177734375, -1.55328369140625, -1.433349609375, -1.31341552734375, -1.1934814453125, -1.07354736328125, -0.95361328125, -0.83367919921875, -0.7137451171875, -0.59381103515625, -0.473876953125, -0.35394287109375, -0.2340087890625, -0.11407470703125, 0.005859375, 0.12579345703125, 0.2457275390625, 0.36566162109375, 0.485595703125, 0.60552978515625, 0.7254638671875, 0.84539794921875, 0.96533203125, 1.08526611328125, 1.2052001953125, 1.32513427734375, 1.445068359375, 1.56500244140625, 1.6849365234375, 1.80487060546875, 1.9248046875, 2.04473876953125, 2.1646728515625, 2.28460693359375, 2.404541015625, 2.52447509765625, 2.6444091796875, 2.76434326171875, 2.88427734375, 3.00421142578125, 3.1241455078125, 3.24407958984375, 3.364013671875, 3.48394775390625, 3.6038818359375, 3.72381591796875, 3.84375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 7.0, 8.0, 6.0, 20.0, 23.0, 19.0, 32.0, 61.0, 103.0, 202.0, 247.0, 416.0, 651.0, 1078.0, 1692.0, 2530.0, 3929.0, 6618.0, 10139.0, 16359.0, 26951.0, 43944.0, 73001.0, 123554.0, 295003.0, 1173434.0, 125691.0, 74704.0, 44797.0, 27022.0, 16652.0, 10456.0, 6455.0, 4041.0, 2647.0, 1655.0, 1177.0, 669.0, 407.0, 248.0, 177.0, 96.0, 63.0, 56.0, 33.0, 18.0, 15.0, 16.0, 4.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.07220458984375, -0.07001781463623047, -0.06783103942871094, -0.0656442642211914, -0.06345748901367188, -0.061270713806152344, -0.05908393859863281, -0.05689716339111328, -0.05471038818359375, -0.05252361297607422, -0.05033683776855469, -0.048150062561035156, -0.045963287353515625, -0.043776512145996094, -0.04158973693847656, -0.03940296173095703, -0.0372161865234375, -0.03502941131591797, -0.03284263610839844, -0.030655860900878906, -0.028469085693359375, -0.026282310485839844, -0.024095535278320312, -0.02190876007080078, -0.01972198486328125, -0.01753520965576172, -0.015348434448242188, -0.013161659240722656, -0.010974884033203125, -0.008788108825683594, -0.0066013336181640625, -0.004414558410644531, -0.002227783203125, -4.100799560546875e-05, 0.0021457672119140625, 0.004332542419433594, 0.006519317626953125, 0.008706092834472656, 0.010892868041992188, 0.013079643249511719, 0.01526641845703125, 0.01745319366455078, 0.019639968872070312, 0.021826744079589844, 0.024013519287109375, 0.026200294494628906, 0.028387069702148438, 0.03057384490966797, 0.0327606201171875, 0.03494739532470703, 0.03713417053222656, 0.039320945739746094, 0.041507720947265625, 0.043694496154785156, 0.04588127136230469, 0.04806804656982422, 0.05025482177734375, 0.05244159698486328, 0.05462837219238281, 0.056815147399902344, 0.059001922607421875, 0.061188697814941406, 0.06337547302246094, 0.06556224822998047, 0.0677490234375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 6.0, 8.0, 8.0, 8.0, 15.0, 22.0, 28.0, 20.0, 20.0, 39.0, 54.0, 57.0, 48.0, 71.0, 92.0, 79.0, 69.0, 71.0, 44.0, 47.0, 42.0, 32.0, 16.0, 20.0, 12.0, 20.0, 8.0, 9.0, 11.0, 4.0, 9.0, 6.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015306472778320312, -0.00014693289995193481, -0.0001408010721206665, -0.0001346692442893982, -0.00012853741645812988, -0.00012240558862686157, -0.00011627376079559326, -0.00011014193296432495, -0.00010401010513305664, -9.787827730178833e-05, -9.174644947052002e-05, -8.561462163925171e-05, -7.94827938079834e-05, -7.335096597671509e-05, -6.721913814544678e-05, -6.108731031417847e-05, -5.4955482482910156e-05, -4.8823654651641846e-05, -4.2691826820373535e-05, -3.6559998989105225e-05, -3.0428171157836914e-05, -2.4296343326568604e-05, -1.8164515495300293e-05, -1.2032687664031982e-05, -5.900859832763672e-06, 2.3096799850463867e-07, 6.362795829772949e-06, 1.249462366104126e-05, 1.862645149230957e-05, 2.475827932357788e-05, 3.089010715484619e-05, 3.70219349861145e-05, 4.315376281738281e-05, 4.928559064865112e-05, 5.5417418479919434e-05, 6.154924631118774e-05, 6.768107414245605e-05, 7.381290197372437e-05, 7.994472980499268e-05, 8.607655763626099e-05, 9.22083854675293e-05, 9.834021329879761e-05, 0.00010447204113006592, 0.00011060386896133423, 0.00011673569679260254, 0.00012286752462387085, 0.00012899935245513916, 0.00013513118028640747, 0.00014126300811767578, 0.0001473948359489441, 0.0001535266637802124, 0.0001596584916114807, 0.00016579031944274902, 0.00017192214727401733, 0.00017805397510528564, 0.00018418580293655396, 0.00019031763076782227, 0.00019644945859909058, 0.0002025812864303589, 0.0002087131142616272, 0.0002148449420928955, 0.00022097676992416382, 0.00022710859775543213, 0.00023324042558670044, 0.00023937225341796875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 9.0, 11.0, 15.0, 16.0, 28.0, 33.0, 37.0, 68.0, 77.0, 91.0, 108.0, 180.0, 256.0, 399.0, 1135.0, 1041621.0, 2885.0, 497.0, 285.0, 224.0, 157.0, 75.0, 82.0, 64.0, 54.0, 28.0, 39.0, 29.0, 15.0, 15.0, 5.0, 7.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.004215240478515625, -0.004086136817932129, -0.003957033157348633, -0.0038279294967651367, -0.0036988258361816406, -0.0035697221755981445, -0.0034406185150146484, -0.0033115148544311523, -0.0031824111938476562, -0.00305330753326416, -0.002924203872680664, -0.002795100212097168, -0.002665996551513672, -0.0025368928909301758, -0.0024077892303466797, -0.0022786855697631836, -0.0021495819091796875, -0.0020204782485961914, -0.0018913745880126953, -0.0017622709274291992, -0.0016331672668457031, -0.001504063606262207, -0.001374959945678711, -0.0012458562850952148, -0.0011167526245117188, -0.0009876489639282227, -0.0008585453033447266, -0.0007294416427612305, -0.0006003379821777344, -0.0004712343215942383, -0.0003421306610107422, -0.0002130270004272461, -8.392333984375e-05, 4.5180320739746094e-05, 0.0001742839813232422, 0.0003033876419067383, 0.0004324913024902344, 0.0005615949630737305, 0.0006906986236572266, 0.0008198022842407227, 0.0009489059448242188, 0.0010780096054077148, 0.001207113265991211, 0.001336216926574707, 0.0014653205871582031, 0.0015944242477416992, 0.0017235279083251953, 0.0018526315689086914, 0.0019817352294921875, 0.0021108388900756836, 0.0022399425506591797, 0.0023690462112426758, 0.002498149871826172, 0.002627253532409668, 0.002756357192993164, 0.00288546085357666, 0.0030145645141601562, 0.0031436681747436523, 0.0032727718353271484, 0.0034018754959106445, 0.0035309791564941406, 0.0036600828170776367, 0.003789186477661133, 0.003918290138244629, 0.004047393798828125]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1008.0, 8.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.665895928861573e-05, 2.276245504617691e-05, 8.218386938096955e-05, 0.00014160529826767743, 0.00020102670532651246, 0.0002604481123853475, 0.00031986954854801297, 0.000379290955606848, 0.00043871236266568303, 0.0004981337697245181, 0.0005575551767833531, 0.000616976642049849, 0.0006763980491086841, 0.0007358194561675191, 0.0007952408632263541, 0.0008546622702851892, 0.0009140836773440242, 0.0009735050844028592, 0.0010329264914616942, 0.0010923478985205293, 0.0011517693055793643, 0.0012111907126381993, 0.0012706122361123562, 0.0013300336431711912, 0.0013894549338147044, 0.0014488763408735394, 0.0015082977479323745, 0.0015677191549912095, 0.0016271405620500445, 0.0016865619691088796, 0.0017459834925830364, 0.0018054048996418715, 0.0018648263067007065, 0.0019242477137595415, 0.0019836691208183765, 0.0020430905278772116, 0.0021025119349360466, 0.0021619333419948816, 0.0022213547490537167, 0.0022807761561125517, 0.0023401975631713867, 0.0023996189702302217, 0.0024590403772890568, 0.002518461784347892, 0.002577883191406727, 0.002637304598465562, 0.002696726005524397, 0.002756147412583232, 0.002815568819642067, 0.002874990226700902, 0.002934411633759737, 0.002993833040818572, 0.003053254447877407, 0.003112675854936242, 0.003172097261995077, 0.003231518669053912, 0.003290940308943391, 0.003350361716002226, 0.003409783123061061, 0.003469204530119896, 0.003528625937178731, 0.003588047344237566, 0.003647468751296401, 0.003706890158355236, 0.003766311565414071]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 8.0, 15.0, 11.0, 22.0, 27.0, 40.0, 53.0, 48.0, 77.0, 82.0, 97.0, 58.0, 94.0, 76.0, 69.0, 56.0, 47.0, 35.0, 30.0, 18.0, 9.0, 12.0, 15.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0001519322395324707, -0.00014598481357097626, -0.0001400373876094818, -0.00013408996164798737, -0.00012814253568649292, -0.00012219510972499847, -0.00011624768376350403, -0.00011030025780200958, -0.00010435283184051514, -9.840540587902069e-05, -9.245797991752625e-05, -8.65105539560318e-05, -8.056312799453735e-05, -7.461570203304291e-05, -6.866827607154846e-05, -6.272085011005402e-05, -5.677342414855957e-05, -5.0825998187065125e-05, -4.487857222557068e-05, -3.893114626407623e-05, -3.298372030258179e-05, -2.703629434108734e-05, -2.1088868379592896e-05, -1.514144241809845e-05, -9.194016456604004e-06, -3.246590495109558e-06, 2.7008354663848877e-06, 8.648261427879333e-06, 1.459568738937378e-05, 2.0543113350868225e-05, 2.649053931236267e-05, 3.243796527385712e-05, 3.838539123535156e-05, 4.433281719684601e-05, 5.0280243158340454e-05, 5.62276691198349e-05, 6.217509508132935e-05, 6.812252104282379e-05, 7.406994700431824e-05, 8.001737296581268e-05, 8.596479892730713e-05, 9.191222488880157e-05, 9.785965085029602e-05, 0.00010380707681179047, 0.00010975450277328491, 0.00011570192873477936, 0.0001216493546962738, 0.00012759678065776825, 0.0001335442066192627, 0.00013949163258075714, 0.0001454390585422516, 0.00015138648450374603, 0.00015733391046524048, 0.00016328133642673492, 0.00016922876238822937, 0.00017517618834972382, 0.00018112361431121826, 0.0001870710402727127, 0.00019301846623420715, 0.0001989658921957016, 0.00020491331815719604, 0.0002108607441186905, 0.00021680817008018494, 0.00022275559604167938, 0.00022870302200317383]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 6.0, 5.0, 7.0, 12.0, 9.0, 7.0, 10.0, 8.0, 9.0, 17.0, 18.0, 25.0, 16.0, 28.0, 30.0, 42.0, 58.0, 62.0, 94.0, 92.0, 99.0, 62.0, 49.0, 31.0, 28.0, 22.0, 20.0, 27.0, 12.0, 20.0, 10.0, 12.0, 8.0, 6.0, 7.0, 8.0, 7.0, 3.0, 3.0, 8.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.984375, -8.666259765625, -8.34814453125, -8.030029296875, -7.7119140625, -7.393798828125, -7.07568359375, -6.757568359375, -6.439453125, -6.121337890625, -5.80322265625, -5.485107421875, -5.1669921875, -4.848876953125, -4.53076171875, -4.212646484375, -3.89453125, -3.576416015625, -3.25830078125, -2.940185546875, -2.6220703125, -2.303955078125, -1.98583984375, -1.667724609375, -1.349609375, -1.031494140625, -0.71337890625, -0.395263671875, -0.0771484375, 0.240966796875, 0.55908203125, 0.877197265625, 1.1953125, 1.513427734375, 1.83154296875, 2.149658203125, 2.4677734375, 2.785888671875, 3.10400390625, 3.422119140625, 3.740234375, 4.058349609375, 4.37646484375, 4.694580078125, 5.0126953125, 5.330810546875, 5.64892578125, 5.967041015625, 6.28515625, 6.603271484375, 6.92138671875, 7.239501953125, 7.5576171875, 7.875732421875, 8.19384765625, 8.511962890625, 8.830078125, 9.148193359375, 9.46630859375, 9.784423828125, 10.1025390625, 10.420654296875, 10.73876953125, 11.056884765625, 11.375]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 6.0, 11.0, 17.0, 15.0, 33.0, 41.0, 53.0, 87.0, 105.0, 157.0, 181.0, 264.0, 365.0, 500.0, 749.0, 1109.0, 1650.0, 2760.0, 4670.0, 8910.0, 20372.0, 65274.0, 728714.0, 152277.0, 31795.0, 12404.0, 6218.0, 3351.0, 2094.0, 1351.0, 917.0, 573.0, 436.0, 290.0, 207.0, 177.0, 110.0, 87.0, 70.0, 42.0, 37.0, 27.0, 16.0, 8.0, 8.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-38.625, -37.36767578125, -36.1103515625, -34.85302734375, -33.595703125, -32.33837890625, -31.0810546875, -29.82373046875, -28.56640625, -27.30908203125, -26.0517578125, -24.79443359375, -23.537109375, -22.27978515625, -21.0224609375, -19.76513671875, -18.5078125, -17.25048828125, -15.9931640625, -14.73583984375, -13.478515625, -12.22119140625, -10.9638671875, -9.70654296875, -8.44921875, -7.19189453125, -5.9345703125, -4.67724609375, -3.419921875, -2.16259765625, -0.9052734375, 0.35205078125, 1.609375, 2.86669921875, 4.1240234375, 5.38134765625, 6.638671875, 7.89599609375, 9.1533203125, 10.41064453125, 11.66796875, 12.92529296875, 14.1826171875, 15.43994140625, 16.697265625, 17.95458984375, 19.2119140625, 20.46923828125, 21.7265625, 22.98388671875, 24.2412109375, 25.49853515625, 26.755859375, 28.01318359375, 29.2705078125, 30.52783203125, 31.78515625, 33.04248046875, 34.2998046875, 35.55712890625, 36.814453125, 38.07177734375, 39.3291015625, 40.58642578125, 41.84375]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 7.0, 8.0, 4.0, 7.0, 7.0, 6.0, 8.0, 9.0, 11.0, 27.0, 24.0, 21.0, 26.0, 20.0, 29.0, 28.0, 36.0, 44.0, 46.0, 44.0, 59.0, 105.0, 281.0, 1538.0, 154.0, 86.0, 57.0, 32.0, 49.0, 31.0, 27.0, 35.0, 31.0, 27.0, 19.0, 21.0, 19.0, 11.0, 12.0, 10.0, 4.0, 5.0, 7.0, 6.0, 8.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.21875, -25.40380859375, -24.5888671875, -23.77392578125, -22.958984375, -22.14404296875, -21.3291015625, -20.51416015625, -19.69921875, -18.88427734375, -18.0693359375, -17.25439453125, -16.439453125, -15.62451171875, -14.8095703125, -13.99462890625, -13.1796875, -12.36474609375, -11.5498046875, -10.73486328125, -9.919921875, -9.10498046875, -8.2900390625, -7.47509765625, -6.66015625, -5.84521484375, -5.0302734375, -4.21533203125, -3.400390625, -2.58544921875, -1.7705078125, -0.95556640625, -0.140625, 0.67431640625, 1.4892578125, 2.30419921875, 3.119140625, 3.93408203125, 4.7490234375, 5.56396484375, 6.37890625, 7.19384765625, 8.0087890625, 8.82373046875, 9.638671875, 10.45361328125, 11.2685546875, 12.08349609375, 12.8984375, 13.71337890625, 14.5283203125, 15.34326171875, 16.158203125, 16.97314453125, 17.7880859375, 18.60302734375, 19.41796875, 20.23291015625, 21.0478515625, 21.86279296875, 22.677734375, 23.49267578125, 24.3076171875, 25.12255859375, 25.9375]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 1.0, 3.0, 5.0, 4.0, 7.0, 11.0, 17.0, 11.0, 13.0, 18.0, 18.0, 22.0, 35.0, 32.0, 45.0, 87.0, 114.0, 203.0, 562.0, 4534.0, 2598080.0, 537207.0, 3519.0, 475.0, 201.0, 118.0, 77.0, 56.0, 33.0, 34.0, 25.0, 23.0, 21.0, 20.0, 16.0, 11.0, 11.0, 9.0, 5.0, 8.0, 5.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-106.6875, -103.0029296875, -99.318359375, -95.6337890625, -91.94921875, -88.2646484375, -84.580078125, -80.8955078125, -77.2109375, -73.5263671875, -69.841796875, -66.1572265625, -62.47265625, -58.7880859375, -55.103515625, -51.4189453125, -47.734375, -44.0498046875, -40.365234375, -36.6806640625, -32.99609375, -29.3115234375, -25.626953125, -21.9423828125, -18.2578125, -14.5732421875, -10.888671875, -7.2041015625, -3.51953125, 0.1650390625, 3.849609375, 7.5341796875, 11.21875, 14.9033203125, 18.587890625, 22.2724609375, 25.95703125, 29.6416015625, 33.326171875, 37.0107421875, 40.6953125, 44.3798828125, 48.064453125, 51.7490234375, 55.43359375, 59.1181640625, 62.802734375, 66.4873046875, 70.171875, 73.8564453125, 77.541015625, 81.2255859375, 84.91015625, 88.5947265625, 92.279296875, 95.9638671875, 99.6484375, 103.3330078125, 107.017578125, 110.7021484375, 114.38671875, 118.0712890625, 121.755859375, 125.4404296875, 129.125]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 42.0, 305.0, 468.0, 138.0, 32.0, 17.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-177.86587524414062, -172.7935791015625, -167.7212677001953, -162.64895629882812, -157.57666015625, -152.50436401367188, -147.4320526123047, -142.3597412109375, -137.28744506835938, -132.21514892578125, -127.14283752441406, -122.0705337524414, -116.99822998046875, -111.9259262084961, -106.85362243652344, -101.78131866455078, -96.70901489257812, -91.63671112060547, -86.56440734863281, -81.49210357666016, -76.4197998046875, -71.34749603271484, -66.27519226074219, -61.20288848876953, -56.130584716796875, -51.05828094482422, -45.98597717285156, -40.913673400878906, -35.84136962890625, -30.769065856933594, -25.696762084960938, -20.62445831298828, -15.552154541015625, -10.479850769042969, -5.4075469970703125, -0.33524322509765625, 4.737060546875, 9.809364318847656, 14.881668090820312, 19.95397186279297, 25.026275634765625, 30.09857940673828, 35.17088317871094, 40.243186950683594, 45.31549072265625, 50.387794494628906, 55.46009826660156, 60.53240203857422, 65.60470581054688, 70.67700958251953, 75.74931335449219, 80.82161712646484, 85.8939208984375, 90.96622467041016, 96.03852844238281, 101.11083221435547, 106.18313598632812, 111.25543975830078, 116.32774353027344, 121.4000473022461, 126.47235107421875, 131.54464721679688, 136.61695861816406, 141.68927001953125, 146.76156616210938]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 12.0, 9.0, 11.0, 12.0, 18.0, 17.0, 28.0, 32.0, 31.0, 37.0, 45.0, 52.0, 49.0, 46.0, 61.0, 54.0, 65.0, 51.0, 52.0, 49.0, 55.0, 35.0, 30.0, 42.0, 28.0, 23.0, 14.0, 17.0, 9.0, 6.0, 3.0, 7.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-118.12557983398438, -114.09078216552734, -110.05598449707031, -106.02118682861328, -101.98638916015625, -97.95159149169922, -93.91679382324219, -89.88199615478516, -85.84719848632812, -81.8124008178711, -77.77760314941406, -73.74280548095703, -69.7080078125, -65.67321014404297, -61.63841247558594, -57.603614807128906, -53.568817138671875, -49.534019470214844, -45.49922180175781, -41.46442413330078, -37.42962646484375, -33.39482879638672, -29.360031127929688, -25.325233459472656, -21.290435791015625, -17.255638122558594, -13.220840454101562, -9.186042785644531, -5.1512451171875, -1.1164474487304688, 2.9183502197265625, 6.953147888183594, 10.987945556640625, 15.022743225097656, 19.057540893554688, 23.09233856201172, 27.12713623046875, 31.16193389892578, 35.19673156738281, 39.231529235839844, 43.266326904296875, 47.301124572753906, 51.33592224121094, 55.37071990966797, 59.405517578125, 63.44031524658203, 67.47511291503906, 71.5099105834961, 75.54470825195312, 79.57950592041016, 83.61430358886719, 87.64910125732422, 91.68389892578125, 95.71869659423828, 99.75349426269531, 103.78829193115234, 107.82308959960938, 111.8578872680664, 115.89268493652344, 119.92748260498047, 123.9622802734375, 127.99707794189453, 132.03187561035156, 136.06668090820312, 140.10147094726562]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 4.0, 5.0, 17.0, 7.0, 12.0, 7.0, 6.0, 11.0, 16.0, 21.0, 18.0, 14.0, 26.0, 35.0, 39.0, 57.0, 76.0, 85.0, 66.0, 83.0, 73.0, 51.0, 43.0, 27.0, 36.0, 22.0, 13.0, 23.0, 17.0, 15.0, 7.0, 10.0, 7.0, 9.0, 8.0, 4.0, 7.0, 7.0, 6.0, 1.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.7265625, -8.409912109375, -8.09326171875, -7.776611328125, -7.4599609375, -7.143310546875, -6.82666015625, -6.510009765625, -6.193359375, -5.876708984375, -5.56005859375, -5.243408203125, -4.9267578125, -4.610107421875, -4.29345703125, -3.976806640625, -3.66015625, -3.343505859375, -3.02685546875, -2.710205078125, -2.3935546875, -2.076904296875, -1.76025390625, -1.443603515625, -1.126953125, -0.810302734375, -0.49365234375, -0.177001953125, 0.1396484375, 0.456298828125, 0.77294921875, 1.089599609375, 1.40625, 1.722900390625, 2.03955078125, 2.356201171875, 2.6728515625, 2.989501953125, 3.30615234375, 3.622802734375, 3.939453125, 4.256103515625, 4.57275390625, 4.889404296875, 5.2060546875, 5.522705078125, 5.83935546875, 6.156005859375, 6.47265625, 6.789306640625, 7.10595703125, 7.422607421875, 7.7392578125, 8.055908203125, 8.37255859375, 8.689208984375, 9.005859375, 9.322509765625, 9.63916015625, 9.955810546875, 10.2724609375, 10.589111328125, 10.90576171875, 11.222412109375, 11.5390625]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 8.0, 7.0, 14.0, 9.0, 9.0, 22.0, 13.0, 22.0, 46.0, 44.0, 88.0, 110.0, 220.0, 316.0, 607.0, 1356.0, 3679.0, 17056.0, 3957117.0, 201234.0, 7942.0, 2257.0, 905.0, 415.0, 273.0, 170.0, 103.0, 50.0, 51.0, 25.0, 27.0, 20.0, 10.0, 9.0, 13.0, 7.0, 5.0, 7.0, 5.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.5625, -76.6982421875, -73.833984375, -70.9697265625, -68.10546875, -65.2412109375, -62.376953125, -59.5126953125, -56.6484375, -53.7841796875, -50.919921875, -48.0556640625, -45.19140625, -42.3271484375, -39.462890625, -36.5986328125, -33.734375, -30.8701171875, -28.005859375, -25.1416015625, -22.27734375, -19.4130859375, -16.548828125, -13.6845703125, -10.8203125, -7.9560546875, -5.091796875, -2.2275390625, 0.63671875, 3.5009765625, 6.365234375, 9.2294921875, 12.09375, 14.9580078125, 17.822265625, 20.6865234375, 23.55078125, 26.4150390625, 29.279296875, 32.1435546875, 35.0078125, 37.8720703125, 40.736328125, 43.6005859375, 46.46484375, 49.3291015625, 52.193359375, 55.0576171875, 57.921875, 60.7861328125, 63.650390625, 66.5146484375, 69.37890625, 72.2431640625, 75.107421875, 77.9716796875, 80.8359375, 83.7001953125, 86.564453125, 89.4287109375, 92.29296875, 95.1572265625, 98.021484375, 100.8857421875, 103.75]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 4.0, 5.0, 4.0, 8.0, 2.0, 5.0, 6.0, 11.0, 9.0, 9.0, 13.0, 17.0, 33.0, 25.0, 38.0, 74.0, 125.0, 283.0, 601.0, 1021.0, 816.0, 403.0, 200.0, 95.0, 58.0, 41.0, 35.0, 20.0, 19.0, 16.0, 13.0, 11.0, 9.0, 8.0, 3.0, 4.0, 6.0, 8.0, 3.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.4375, -28.537353515625, -27.63720703125, -26.737060546875, -25.8369140625, -24.936767578125, -24.03662109375, -23.136474609375, -22.236328125, -21.336181640625, -20.43603515625, -19.535888671875, -18.6357421875, -17.735595703125, -16.83544921875, -15.935302734375, -15.03515625, -14.135009765625, -13.23486328125, -12.334716796875, -11.4345703125, -10.534423828125, -9.63427734375, -8.734130859375, -7.833984375, -6.933837890625, -6.03369140625, -5.133544921875, -4.2333984375, -3.333251953125, -2.43310546875, -1.532958984375, -0.6328125, 0.267333984375, 1.16748046875, 2.067626953125, 2.9677734375, 3.867919921875, 4.76806640625, 5.668212890625, 6.568359375, 7.468505859375, 8.36865234375, 9.268798828125, 10.1689453125, 11.069091796875, 11.96923828125, 12.869384765625, 13.76953125, 14.669677734375, 15.56982421875, 16.469970703125, 17.3701171875, 18.270263671875, 19.17041015625, 20.070556640625, 20.970703125, 21.870849609375, 22.77099609375, 23.671142578125, 24.5712890625, 25.471435546875, 26.37158203125, 27.271728515625, 28.171875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 8.0, 10.0, 6.0, 6.0, 11.0, 18.0, 21.0, 47.0, 46.0, 88.0, 136.0, 243.0, 485.0, 1025.0, 2727.0, 8026.0, 27596.0, 244579.0, 3791552.0, 91075.0, 17483.0, 5495.0, 1907.0, 751.0, 365.0, 199.0, 117.0, 69.0, 56.0, 34.0, 23.0, 18.0, 8.0, 7.0, 7.0, 7.0, 10.0, 3.0, 5.0, 1.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-62.75, -60.86767578125, -58.9853515625, -57.10302734375, -55.220703125, -53.33837890625, -51.4560546875, -49.57373046875, -47.69140625, -45.80908203125, -43.9267578125, -42.04443359375, -40.162109375, -38.27978515625, -36.3974609375, -34.51513671875, -32.6328125, -30.75048828125, -28.8681640625, -26.98583984375, -25.103515625, -23.22119140625, -21.3388671875, -19.45654296875, -17.57421875, -15.69189453125, -13.8095703125, -11.92724609375, -10.044921875, -8.16259765625, -6.2802734375, -4.39794921875, -2.515625, -0.63330078125, 1.2490234375, 3.13134765625, 5.013671875, 6.89599609375, 8.7783203125, 10.66064453125, 12.54296875, 14.42529296875, 16.3076171875, 18.18994140625, 20.072265625, 21.95458984375, 23.8369140625, 25.71923828125, 27.6015625, 29.48388671875, 31.3662109375, 33.24853515625, 35.130859375, 37.01318359375, 38.8955078125, 40.77783203125, 42.66015625, 44.54248046875, 46.4248046875, 48.30712890625, 50.189453125, 52.07177734375, 53.9541015625, 55.83642578125, 57.71875]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 12.0, 41.0, 203.0, 579.0, 122.0, 37.0, 11.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-296.17376708984375, -286.0932312011719, -276.0126953125, -265.93212890625, -255.85159301757812, -245.77105712890625, -235.6905059814453, -225.60995483398438, -215.5294189453125, -205.44888305664062, -195.3683319091797, -185.28778076171875, -175.20724487304688, -165.126708984375, -155.04615783691406, -144.96560668945312, -134.88507080078125, -124.80452728271484, -114.72398376464844, -104.64344024658203, -94.56289672851562, -84.48235321044922, -74.40180969238281, -64.3212661743164, -54.24072265625, -44.160179138183594, -34.07963562011719, -23.99909210205078, -13.918548583984375, -3.8380050659179688, 6.2425384521484375, 16.323081970214844, 26.403656005859375, 36.48419952392578, 46.56474304199219, 56.645286560058594, 66.725830078125, 76.8063735961914, 86.88691711425781, 96.96746063232422, 107.04800415039062, 117.12854766845703, 127.20909118652344, 137.28964233398438, 147.37017822265625, 157.45071411132812, 167.53126525878906, 177.61181640625, 187.69235229492188, 197.77288818359375, 207.8534393310547, 217.93399047851562, 228.0145263671875, 238.09506225585938, 248.1756134033203, 258.25616455078125, 268.3367004394531, 278.417236328125, 288.497802734375, 298.5783386230469, 308.65887451171875, 318.7394104003906, 328.8199462890625, 338.9005126953125, 348.9810485839844]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 3.0, 7.0, 10.0, 12.0, 11.0, 13.0, 16.0, 12.0, 19.0, 16.0, 24.0, 23.0, 26.0, 30.0, 39.0, 38.0, 41.0, 50.0, 48.0, 44.0, 44.0, 48.0, 40.0, 35.0, 38.0, 42.0, 41.0, 34.0, 23.0, 16.0, 20.0, 18.0, 20.0, 19.0, 23.0, 8.0, 10.0, 13.0, 8.0, 3.0, 5.0, 6.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-89.58663940429688, -86.78866577148438, -83.99069213867188, -81.19271850585938, -78.39474487304688, -75.59677124023438, -72.79879760742188, -70.00081634521484, -67.20284271240234, -64.40486907958984, -61.606895446777344, -58.808921813964844, -56.01094436645508, -53.21297073364258, -50.41499710083008, -47.61701965332031, -44.81904983520508, -42.02107620239258, -39.22310256958008, -36.42512512207031, -33.62715148925781, -30.829177856445312, -28.031204223632812, -25.23322868347168, -22.43525505065918, -19.63728141784668, -16.839305877685547, -14.041332244873047, -11.24335765838623, -8.445383071899414, -5.647409439086914, -2.8494338989257812, -0.05146026611328125, 2.746514081954956, 5.544488430023193, 8.342462539672852, 11.140437126159668, 13.938411712646484, 16.736385345458984, 19.534360885620117, 22.332334518432617, 25.130308151245117, 27.92828369140625, 30.72625732421875, 33.52423095703125, 36.32220458984375, 39.12017822265625, 41.918155670166016, 44.716129302978516, 47.514102935791016, 50.312076568603516, 53.11005401611328, 55.90802764892578, 58.70600128173828, 61.50397491455078, 64.30194854736328, 67.09992218017578, 69.89789581298828, 72.69586944580078, 75.49384307861328, 78.29181671142578, 81.08979797363281, 83.88777160644531, 86.68574523925781, 89.48371887207031]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 0.0, 6.0, 2.0, 1.0, 8.0, 5.0, 7.0, 8.0, 8.0, 13.0, 5.0, 5.0, 18.0, 5.0, 20.0, 21.0, 18.0, 27.0, 26.0, 34.0, 51.0, 63.0, 62.0, 66.0, 69.0, 75.0, 59.0, 59.0, 39.0, 28.0, 30.0, 25.0, 20.0, 22.0, 19.0, 16.0, 11.0, 7.0, 10.0, 5.0, 4.0, 7.0, 8.0, 10.0, 2.0, 2.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.25, -7.95947265625, -7.6689453125, -7.37841796875, -7.087890625, -6.79736328125, -6.5068359375, -6.21630859375, -5.92578125, -5.63525390625, -5.3447265625, -5.05419921875, -4.763671875, -4.47314453125, -4.1826171875, -3.89208984375, -3.6015625, -3.31103515625, -3.0205078125, -2.72998046875, -2.439453125, -2.14892578125, -1.8583984375, -1.56787109375, -1.27734375, -0.98681640625, -0.6962890625, -0.40576171875, -0.115234375, 0.17529296875, 0.4658203125, 0.75634765625, 1.046875, 1.33740234375, 1.6279296875, 1.91845703125, 2.208984375, 2.49951171875, 2.7900390625, 3.08056640625, 3.37109375, 3.66162109375, 3.9521484375, 4.24267578125, 4.533203125, 4.82373046875, 5.1142578125, 5.40478515625, 5.6953125, 5.98583984375, 6.2763671875, 6.56689453125, 6.857421875, 7.14794921875, 7.4384765625, 7.72900390625, 8.01953125, 8.31005859375, 8.6005859375, 8.89111328125, 9.181640625, 9.47216796875, 9.7626953125, 10.05322265625, 10.34375]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 7.0, 7.0, 9.0, 13.0, 22.0, 30.0, 36.0, 85.0, 112.0, 156.0, 267.0, 395.0, 610.0, 876.0, 1339.0, 2044.0, 3128.0, 4862.0, 7496.0, 11716.0, 19894.0, 34611.0, 64622.0, 130183.0, 278723.0, 240410.0, 111806.0, 56263.0, 30677.0, 17713.0, 10845.0, 6669.0, 4486.0, 2906.0, 1884.0, 1254.0, 816.0, 544.0, 344.0, 235.0, 179.0, 109.0, 58.0, 40.0, 33.0, 18.0, 9.0, 8.0, 8.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.18359375, -0.17801284790039062, -0.17243194580078125, -0.16685104370117188, -0.1612701416015625, -0.15568923950195312, -0.15010833740234375, -0.14452743530273438, -0.138946533203125, -0.13336563110351562, -0.12778472900390625, -0.12220382690429688, -0.1166229248046875, -0.11104202270507812, -0.10546112060546875, -0.09988021850585938, -0.09429931640625, -0.08871841430664062, -0.08313751220703125, -0.07755661010742188, -0.0719757080078125, -0.06639480590820312, -0.06081390380859375, -0.055233001708984375, -0.049652099609375, -0.044071197509765625, -0.03849029541015625, -0.032909393310546875, -0.0273284912109375, -0.021747589111328125, -0.01616668701171875, -0.010585784912109375, -0.0050048828125, 0.000576019287109375, 0.00615692138671875, 0.011737823486328125, 0.0173187255859375, 0.022899627685546875, 0.02848052978515625, 0.034061431884765625, 0.039642333984375, 0.045223236083984375, 0.05080413818359375, 0.056385040283203125, 0.0619659423828125, 0.06754684448242188, 0.07312774658203125, 0.07870864868164062, 0.08428955078125, 0.08987045288085938, 0.09545135498046875, 0.10103225708007812, 0.1066131591796875, 0.11219406127929688, 0.11777496337890625, 0.12335586547851562, 0.128936767578125, 0.13451766967773438, 0.14009857177734375, 0.14567947387695312, 0.1512603759765625, 0.15684127807617188, 0.16242218017578125, 0.16800308227539062, 0.173583984375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 5.0, 5.0, 8.0, 8.0, 11.0, 21.0, 13.0, 19.0, 21.0, 38.0, 25.0, 32.0, 28.0, 42.0, 39.0, 35.0, 30.0, 48.0, 52.0, 1068.0, 47.0, 41.0, 38.0, 43.0, 33.0, 32.0, 36.0, 30.0, 28.0, 30.0, 22.0, 20.0, 13.0, 20.0, 11.0, 7.0, 12.0, 7.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.17578125, -4.043212890625, -3.91064453125, -3.778076171875, -3.6455078125, -3.512939453125, -3.38037109375, -3.247802734375, -3.115234375, -2.982666015625, -2.85009765625, -2.717529296875, -2.5849609375, -2.452392578125, -2.31982421875, -2.187255859375, -2.0546875, -1.922119140625, -1.78955078125, -1.656982421875, -1.5244140625, -1.391845703125, -1.25927734375, -1.126708984375, -0.994140625, -0.861572265625, -0.72900390625, -0.596435546875, -0.4638671875, -0.331298828125, -0.19873046875, -0.066162109375, 0.06640625, 0.198974609375, 0.33154296875, 0.464111328125, 0.5966796875, 0.729248046875, 0.86181640625, 0.994384765625, 1.126953125, 1.259521484375, 1.39208984375, 1.524658203125, 1.6572265625, 1.789794921875, 1.92236328125, 2.054931640625, 2.1875, 2.320068359375, 2.45263671875, 2.585205078125, 2.7177734375, 2.850341796875, 2.98291015625, 3.115478515625, 3.248046875, 3.380615234375, 3.51318359375, 3.645751953125, 3.7783203125, 3.910888671875, 4.04345703125, 4.176025390625, 4.30859375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 4.0, 7.0, 3.0, 9.0, 10.0, 16.0, 32.0, 42.0, 55.0, 97.0, 124.0, 172.0, 258.0, 349.0, 519.0, 743.0, 1168.0, 1601.0, 2336.0, 3505.0, 4964.0, 7378.0, 10645.0, 15421.0, 23526.0, 34072.0, 49646.0, 73216.0, 112082.0, 177446.0, 1219606.0, 117368.0, 77149.0, 51968.0, 35445.0, 24223.0, 16378.0, 11198.0, 7675.0, 5247.0, 3501.0, 2421.0, 1684.0, 1191.0, 876.0, 524.0, 400.0, 262.0, 193.0, 109.0, 88.0, 78.0, 51.0, 24.0, 9.0, 10.0, 11.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0], "bins": [-0.0557861328125, -0.05398988723754883, -0.052193641662597656, -0.050397396087646484, -0.04860115051269531, -0.04680490493774414, -0.04500865936279297, -0.0432124137878418, -0.041416168212890625, -0.03961992263793945, -0.03782367706298828, -0.03602743148803711, -0.03423118591308594, -0.032434940338134766, -0.030638694763183594, -0.028842449188232422, -0.02704620361328125, -0.025249958038330078, -0.023453712463378906, -0.021657466888427734, -0.019861221313476562, -0.01806497573852539, -0.01626873016357422, -0.014472484588623047, -0.012676239013671875, -0.010879993438720703, -0.009083747863769531, -0.007287502288818359, -0.0054912567138671875, -0.0036950111389160156, -0.0018987655639648438, -0.00010251998901367188, 0.0016937255859375, 0.003489971160888672, 0.005286216735839844, 0.007082462310791016, 0.008878707885742188, 0.01067495346069336, 0.012471199035644531, 0.014267444610595703, 0.016063690185546875, 0.017859935760498047, 0.01965618133544922, 0.02145242691040039, 0.023248672485351562, 0.025044918060302734, 0.026841163635253906, 0.028637409210205078, 0.03043365478515625, 0.03222990036010742, 0.034026145935058594, 0.035822391510009766, 0.03761863708496094, 0.03941488265991211, 0.04121112823486328, 0.04300737380981445, 0.044803619384765625, 0.0465998649597168, 0.04839611053466797, 0.05019235610961914, 0.05198860168457031, 0.053784847259521484, 0.055581092834472656, 0.05737733840942383, 0.059173583984375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 6.0, 6.0, 5.0, 17.0, 19.0, 26.0, 25.0, 34.0, 35.0, 57.0, 57.0, 85.0, 67.0, 80.0, 72.0, 61.0, 63.0, 66.0, 59.0, 38.0, 30.0, 15.0, 15.0, 13.0, 9.0, 8.0, 6.0, 3.0, 8.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001628398895263672, -0.00015756674110889435, -0.0001522935926914215, -0.00014702044427394867, -0.00014174729585647583, -0.000136474147439003, -0.00013120099902153015, -0.0001259278506040573, -0.00012065470218658447, -0.00011538155376911163, -0.0001101084053516388, -0.00010483525693416595, -9.956210851669312e-05, -9.428896009922028e-05, -8.901581168174744e-05, -8.37426632642746e-05, -7.846951484680176e-05, -7.319636642932892e-05, -6.792321801185608e-05, -6.265006959438324e-05, -5.73769211769104e-05, -5.210377275943756e-05, -4.683062434196472e-05, -4.155747592449188e-05, -3.628432750701904e-05, -3.1011179089546204e-05, -2.5738030672073364e-05, -2.0464882254600525e-05, -1.5191733837127686e-05, -9.918585419654846e-06, -4.645437002182007e-06, 6.277114152908325e-07, 5.900859832763672e-06, 1.1174008250236511e-05, 1.644715666770935e-05, 2.172030508518219e-05, 2.699345350265503e-05, 3.226660192012787e-05, 3.753975033760071e-05, 4.281289875507355e-05, 4.808604717254639e-05, 5.3359195590019226e-05, 5.8632344007492065e-05, 6.39054924249649e-05, 6.917864084243774e-05, 7.445178925991058e-05, 7.972493767738342e-05, 8.499808609485626e-05, 9.02712345123291e-05, 9.554438292980194e-05, 0.00010081753134727478, 0.00010609067976474762, 0.00011136382818222046, 0.0001166369765996933, 0.00012191012501716614, 0.00012718327343463898, 0.00013245642185211182, 0.00013772957026958466, 0.0001430027186870575, 0.00014827586710453033, 0.00015354901552200317, 0.000158822163939476, 0.00016409531235694885, 0.0001693684607744217, 0.00017464160919189453]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 1.0, 3.0, 4.0, 4.0, 3.0, 14.0, 12.0, 10.0, 18.0, 20.0, 22.0, 42.0, 56.0, 70.0, 80.0, 94.0, 149.0, 227.0, 283.0, 490.0, 4432.0, 1033649.0, 7239.0, 528.0, 272.0, 221.0, 157.0, 140.0, 65.0, 49.0, 53.0, 28.0, 31.0, 18.0, 16.0, 15.0, 9.0, 10.0, 6.0, 6.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0027408599853515625, -0.002651125192642212, -0.0025613903999328613, -0.0024716556072235107, -0.00238192081451416, -0.0022921860218048096, -0.002202451229095459, -0.0021127164363861084, -0.002022981643676758, -0.0019332468509674072, -0.0018435120582580566, -0.001753777265548706, -0.0016640424728393555, -0.0015743076801300049, -0.0014845728874206543, -0.0013948380947113037, -0.0013051033020019531, -0.0012153685092926025, -0.001125633716583252, -0.0010358989238739014, -0.0009461641311645508, -0.0008564293384552002, -0.0007666945457458496, -0.000676959753036499, -0.0005872249603271484, -0.0004974901676177979, -0.00040775537490844727, -0.0003180205821990967, -0.0002282857894897461, -0.0001385509967803955, -4.881620407104492e-05, 4.0918588638305664e-05, 0.00013065338134765625, 0.00022038817405700684, 0.0003101229667663574, 0.000399857759475708, 0.0004895925521850586, 0.0005793273448944092, 0.0006690621376037598, 0.0007587969303131104, 0.0008485317230224609, 0.0009382665157318115, 0.0010280013084411621, 0.0011177361011505127, 0.0012074708938598633, 0.0012972056865692139, 0.0013869404792785645, 0.001476675271987915, 0.0015664100646972656, 0.0016561448574066162, 0.0017458796501159668, 0.0018356144428253174, 0.001925349235534668, 0.0020150840282440186, 0.002104818820953369, 0.0021945536136627197, 0.0022842884063720703, 0.002374023199081421, 0.0024637579917907715, 0.002553492784500122, 0.0026432275772094727, 0.0027329623699188232, 0.002822697162628174, 0.0029124319553375244, 0.003002166748046875]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [75.0, 925.0, 16.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.584178921300918e-05, -8.314827937283553e-06, 1.9212133338442072e-05, 4.6739092795178294e-05, 7.426605588989332e-05, 0.00010179301898460835, 0.00012931997480336577, 0.0001568469451740384, 0.00018437390099279583, 0.00021190085681155324, 0.00023942782718222588, 0.00026695476844906807, 0.00029448175337165594, 0.00032200870919041336, 0.00034953566500917077, 0.00037706264993175864, 0.0004045895766466856, 0.000432116532465443, 0.00045964348828420043, 0.0004871704732067883, 0.0005146973999217153, 0.0005422243848443031, 0.000569751369766891, 0.000597278296481818, 0.0006248052814044058, 0.0006523322663269937, 0.0006798591930419207, 0.0007073861779645085, 0.0007349131046794355, 0.0007624400896020234, 0.0007899670163169503, 0.0008174940012395382, 0.0008450209279544652, 0.000872547912877053, 0.00090007483959198, 0.0009276018245145679, 0.0009551287512294948, 0.0009826556779444218, 0.0010101826628670096, 0.0010377096477895975, 0.0010652366327121854, 0.0010927636176347733, 0.0011202906025573611, 0.0011478174710646272, 0.001175344455987215, 0.001202871440909803, 0.0012303984258323908, 0.0012579254107549787, 0.0012854522792622447, 0.0013129792641848326, 0.0013405062491074204, 0.0013680331176146865, 0.0013955601025372744, 0.0014230870874598622, 0.00145061407238245, 0.001478141057305038, 0.0015056680422276258, 0.0015331950271502137, 0.0015607220120728016, 0.0015882488805800676, 0.0016157758655026555, 0.0016433028504252434, 0.0016708298353478312, 0.0016983568202704191, 0.0017258836887776852]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 12.0, 11.0, 10.0, 11.0, 18.0, 25.0, 18.0, 35.0, 35.0, 41.0, 62.0, 44.0, 34.0, 37.0, 43.0, 53.0, 45.0, 52.0, 46.0, 48.0, 60.0, 42.0, 26.0, 47.0, 33.0, 19.0, 14.0, 13.0, 13.0, 13.0, 8.0, 7.0, 6.0, 5.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.495019912719727e-05, -9.189825505018234e-05, -8.884631097316742e-05, -8.57943668961525e-05, -8.274242281913757e-05, -7.969047874212265e-05, -7.663853466510773e-05, -7.35865905880928e-05, -7.053464651107788e-05, -6.748270243406296e-05, -6.443075835704803e-05, -6.137881428003311e-05, -5.832687020301819e-05, -5.5274926126003265e-05, -5.222298204898834e-05, -4.917103797197342e-05, -4.6119093894958496e-05, -4.306714981794357e-05, -4.001520574092865e-05, -3.696326166391373e-05, -3.3911317586898804e-05, -3.085937350988388e-05, -2.7807429432868958e-05, -2.4755485355854034e-05, -2.170354127883911e-05, -1.8651597201824188e-05, -1.5599653124809265e-05, -1.2547709047794342e-05, -9.495764970779419e-06, -6.443820893764496e-06, -3.3918768167495728e-06, -3.3993273973464966e-07, 2.7120113372802734e-06, 5.7639554142951965e-06, 8.81589949131012e-06, 1.1867843568325043e-05, 1.4919787645339966e-05, 1.797173172235489e-05, 2.1023675799369812e-05, 2.4075619876384735e-05, 2.7127563953399658e-05, 3.017950803041458e-05, 3.3231452107429504e-05, 3.628339618444443e-05, 3.933534026145935e-05, 4.2387284338474274e-05, 4.54392284154892e-05, 4.849117249250412e-05, 5.154311656951904e-05, 5.4595060646533966e-05, 5.764700472354889e-05, 6.069894880056381e-05, 6.375089287757874e-05, 6.680283695459366e-05, 6.985478103160858e-05, 7.29067251086235e-05, 7.595866918563843e-05, 7.901061326265335e-05, 8.206255733966827e-05, 8.51145014166832e-05, 8.816644549369812e-05, 9.121838957071304e-05, 9.427033364772797e-05, 9.732227772474289e-05, 0.00010037422180175781]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 0.0, 6.0, 2.0, 1.0, 8.0, 5.0, 7.0, 8.0, 8.0, 13.0, 5.0, 5.0, 18.0, 5.0, 20.0, 21.0, 18.0, 27.0, 26.0, 34.0, 51.0, 63.0, 62.0, 66.0, 69.0, 75.0, 59.0, 59.0, 39.0, 28.0, 30.0, 25.0, 20.0, 22.0, 19.0, 16.0, 11.0, 7.0, 10.0, 5.0, 4.0, 7.0, 8.0, 10.0, 2.0, 2.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.25, -7.95947265625, -7.6689453125, -7.37841796875, -7.087890625, -6.79736328125, -6.5068359375, -6.21630859375, -5.92578125, -5.63525390625, -5.3447265625, -5.05419921875, -4.763671875, -4.47314453125, -4.1826171875, -3.89208984375, -3.6015625, -3.31103515625, -3.0205078125, -2.72998046875, -2.439453125, -2.14892578125, -1.8583984375, -1.56787109375, -1.27734375, -0.98681640625, -0.6962890625, -0.40576171875, -0.115234375, 0.17529296875, 0.4658203125, 0.75634765625, 1.046875, 1.33740234375, 1.6279296875, 1.91845703125, 2.208984375, 2.49951171875, 2.7900390625, 3.08056640625, 3.37109375, 3.66162109375, 3.9521484375, 4.24267578125, 4.533203125, 4.82373046875, 5.1142578125, 5.40478515625, 5.6953125, 5.98583984375, 6.2763671875, 6.56689453125, 6.857421875, 7.14794921875, 7.4384765625, 7.72900390625, 8.01953125, 8.31005859375, 8.6005859375, 8.89111328125, 9.181640625, 9.47216796875, 9.7626953125, 10.05322265625, 10.34375]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 6.0, 6.0, 6.0, 19.0, 14.0, 27.0, 38.0, 42.0, 67.0, 85.0, 94.0, 139.0, 198.0, 270.0, 379.0, 508.0, 726.0, 1032.0, 1499.0, 2386.0, 3828.0, 7613.0, 20219.0, 111530.0, 801116.0, 64904.0, 15314.0, 6268.0, 3444.0, 2097.0, 1254.0, 973.0, 672.0, 498.0, 362.0, 242.0, 175.0, 128.0, 99.0, 87.0, 56.0, 52.0, 26.0, 29.0, 18.0, 8.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-18.515625, -17.925537109375, -17.33544921875, -16.745361328125, -16.1552734375, -15.565185546875, -14.97509765625, -14.385009765625, -13.794921875, -13.204833984375, -12.61474609375, -12.024658203125, -11.4345703125, -10.844482421875, -10.25439453125, -9.664306640625, -9.07421875, -8.484130859375, -7.89404296875, -7.303955078125, -6.7138671875, -6.123779296875, -5.53369140625, -4.943603515625, -4.353515625, -3.763427734375, -3.17333984375, -2.583251953125, -1.9931640625, -1.403076171875, -0.81298828125, -0.222900390625, 0.3671875, 0.957275390625, 1.54736328125, 2.137451171875, 2.7275390625, 3.317626953125, 3.90771484375, 4.497802734375, 5.087890625, 5.677978515625, 6.26806640625, 6.858154296875, 7.4482421875, 8.038330078125, 8.62841796875, 9.218505859375, 9.80859375, 10.398681640625, 10.98876953125, 11.578857421875, 12.1689453125, 12.759033203125, 13.34912109375, 13.939208984375, 14.529296875, 15.119384765625, 15.70947265625, 16.299560546875, 16.8896484375, 17.479736328125, 18.06982421875, 18.659912109375, 19.25]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 3.0, 1.0, 5.0, 2.0, 7.0, 11.0, 17.0, 11.0, 11.0, 16.0, 18.0, 12.0, 20.0, 31.0, 33.0, 36.0, 32.0, 37.0, 49.0, 38.0, 56.0, 80.0, 417.0, 1563.0, 79.0, 59.0, 34.0, 37.0, 45.0, 42.0, 35.0, 39.0, 17.0, 21.0, 25.0, 24.0, 12.0, 15.0, 11.0, 15.0, 4.0, 6.0, 7.0, 9.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.375, -31.42431640625, -30.4736328125, -29.52294921875, -28.572265625, -27.62158203125, -26.6708984375, -25.72021484375, -24.76953125, -23.81884765625, -22.8681640625, -21.91748046875, -20.966796875, -20.01611328125, -19.0654296875, -18.11474609375, -17.1640625, -16.21337890625, -15.2626953125, -14.31201171875, -13.361328125, -12.41064453125, -11.4599609375, -10.50927734375, -9.55859375, -8.60791015625, -7.6572265625, -6.70654296875, -5.755859375, -4.80517578125, -3.8544921875, -2.90380859375, -1.953125, -1.00244140625, -0.0517578125, 0.89892578125, 1.849609375, 2.80029296875, 3.7509765625, 4.70166015625, 5.65234375, 6.60302734375, 7.5537109375, 8.50439453125, 9.455078125, 10.40576171875, 11.3564453125, 12.30712890625, 13.2578125, 14.20849609375, 15.1591796875, 16.10986328125, 17.060546875, 18.01123046875, 18.9619140625, 19.91259765625, 20.86328125, 21.81396484375, 22.7646484375, 23.71533203125, 24.666015625, 25.61669921875, 26.5673828125, 27.51806640625, 28.46875]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 5.0, 3.0, 10.0, 2.0, 4.0, 6.0, 9.0, 4.0, 13.0, 14.0, 19.0, 26.0, 29.0, 26.0, 35.0, 72.0, 90.0, 116.0, 206.0, 415.0, 833.0, 2446.0, 10272.0, 106567.0, 2984270.0, 31730.0, 5473.0, 1561.0, 592.0, 287.0, 168.0, 106.0, 69.0, 50.0, 41.0, 23.0, 21.0, 13.0, 22.0, 12.0, 11.0, 12.0, 10.0, 6.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-51.15625, -49.28173828125, -47.4072265625, -45.53271484375, -43.658203125, -41.78369140625, -39.9091796875, -38.03466796875, -36.16015625, -34.28564453125, -32.4111328125, -30.53662109375, -28.662109375, -26.78759765625, -24.9130859375, -23.03857421875, -21.1640625, -19.28955078125, -17.4150390625, -15.54052734375, -13.666015625, -11.79150390625, -9.9169921875, -8.04248046875, -6.16796875, -4.29345703125, -2.4189453125, -0.54443359375, 1.330078125, 3.20458984375, 5.0791015625, 6.95361328125, 8.828125, 10.70263671875, 12.5771484375, 14.45166015625, 16.326171875, 18.20068359375, 20.0751953125, 21.94970703125, 23.82421875, 25.69873046875, 27.5732421875, 29.44775390625, 31.322265625, 33.19677734375, 35.0712890625, 36.94580078125, 38.8203125, 40.69482421875, 42.5693359375, 44.44384765625, 46.318359375, 48.19287109375, 50.0673828125, 51.94189453125, 53.81640625, 55.69091796875, 57.5654296875, 59.43994140625, 61.314453125, 63.18896484375, 65.0634765625, 66.93798828125, 68.8125]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [2.0, 961.0, 57.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.7734260559082, -24.038291931152344, 7.696842193603516, 39.43197250366211, 71.1671142578125, 102.90225219726562, 134.6373748779297, 166.3725128173828, 198.10765075683594, 229.84278869628906, 261.5779113769531, 293.31304931640625, 325.0481872558594, 356.7833251953125, 388.5184326171875, 420.25360107421875, 451.98870849609375, 483.7238464355469, 515.458984375, 547.194091796875, 578.9292602539062, 610.6643676757812, 642.3995361328125, 674.1346435546875, 705.8698120117188, 737.6049194335938, 769.340087890625, 801.0751953125, 832.8103637695312, 864.5454711914062, 896.2806396484375, 928.0157470703125, 959.7508544921875, 991.4859619140625, 1023.2211303710938, 1054.956298828125, 1086.69140625, 1118.426513671875, 1150.16162109375, 1181.896728515625, 1213.6319580078125, 1245.3670654296875, 1277.1021728515625, 1308.83740234375, 1340.572509765625, 1372.3076171875, 1404.042724609375, 1435.77783203125, 1467.512939453125, 1499.248046875, 1530.983154296875, 1562.7183837890625, 1594.4534912109375, 1626.1885986328125, 1657.9237060546875, 1689.658935546875, 1721.39404296875, 1753.129150390625, 1784.8642578125, 1816.5994873046875, 1848.3345947265625, 1880.0697021484375, 1911.8048095703125, 1943.5400390625, 1975.275146484375]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 9.0, 6.0, 8.0, 11.0, 12.0, 17.0, 19.0, 16.0, 18.0, 12.0, 24.0, 25.0, 37.0, 34.0, 49.0, 33.0, 49.0, 37.0, 29.0, 36.0, 36.0, 37.0, 43.0, 49.0, 36.0, 40.0, 42.0, 38.0, 34.0, 26.0, 19.0, 17.0, 19.0, 11.0, 14.0, 7.0, 13.0, 8.0, 6.0, 8.0, 5.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-93.44548034667969, -90.22933959960938, -87.01319885253906, -83.79705810546875, -80.5809097290039, -77.3647689819336, -74.14862823486328, -70.93248748779297, -67.71634674072266, -64.50020599365234, -61.284061431884766, -58.06792068481445, -54.85177993774414, -51.63563537597656, -48.41949462890625, -45.20335388183594, -41.98720932006836, -38.77106857299805, -35.55492401123047, -32.338783264160156, -29.122642517089844, -25.9064998626709, -22.690357208251953, -19.47421646118164, -16.258073806762695, -13.041932106018066, -9.825790405273438, -6.609647750854492, -3.3935060501098633, -0.17736434936523438, 3.038778305053711, 6.254919052124023, 9.471061706542969, 12.687203407287598, 15.903345108032227, 19.119487762451172, 22.335628509521484, 25.55177116394043, 28.767913818359375, 31.984054565429688, 35.2001953125, 38.41633605957031, 41.63248062133789, 44.8486213684082, 48.064762115478516, 51.280906677246094, 54.497047424316406, 57.71318817138672, 60.9293327331543, 64.14547729492188, 67.36161804199219, 70.5777587890625, 73.79389953613281, 77.01004028320312, 80.22618103027344, 83.44232177734375, 86.6584701538086, 89.8746109008789, 93.09075164794922, 96.30690002441406, 99.52304077148438, 102.73918151855469, 105.955322265625, 109.17146301269531, 112.38760375976562]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 2.0, 5.0, 6.0, 10.0, 9.0, 11.0, 6.0, 9.0, 11.0, 12.0, 16.0, 13.0, 18.0, 30.0, 30.0, 31.0, 42.0, 51.0, 71.0, 44.0, 82.0, 66.0, 66.0, 55.0, 54.0, 33.0, 29.0, 26.0, 26.0, 19.0, 21.0, 20.0, 8.0, 12.0, 5.0, 7.0, 6.0, 6.0, 6.0, 8.0, 7.0, 2.0, 3.0, 5.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6953125, -8.403076171875, -8.11083984375, -7.818603515625, -7.5263671875, -7.234130859375, -6.94189453125, -6.649658203125, -6.357421875, -6.065185546875, -5.77294921875, -5.480712890625, -5.1884765625, -4.896240234375, -4.60400390625, -4.311767578125, -4.01953125, -3.727294921875, -3.43505859375, -3.142822265625, -2.8505859375, -2.558349609375, -2.26611328125, -1.973876953125, -1.681640625, -1.389404296875, -1.09716796875, -0.804931640625, -0.5126953125, -0.220458984375, 0.07177734375, 0.364013671875, 0.65625, 0.948486328125, 1.24072265625, 1.532958984375, 1.8251953125, 2.117431640625, 2.40966796875, 2.701904296875, 2.994140625, 3.286376953125, 3.57861328125, 3.870849609375, 4.1630859375, 4.455322265625, 4.74755859375, 5.039794921875, 5.33203125, 5.624267578125, 5.91650390625, 6.208740234375, 6.5009765625, 6.793212890625, 7.08544921875, 7.377685546875, 7.669921875, 7.962158203125, 8.25439453125, 8.546630859375, 8.8388671875, 9.131103515625, 9.42333984375, 9.715576171875, 10.0078125]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 1.0, 7.0, 11.0, 7.0, 13.0, 14.0, 18.0, 27.0, 36.0, 45.0, 60.0, 73.0, 94.0, 154.0, 229.0, 364.0, 573.0, 992.0, 1903.0, 3919.0, 9249.0, 35531.0, 3168565.0, 935198.0, 22642.0, 7290.0, 3291.0, 1595.0, 851.0, 510.0, 314.0, 218.0, 130.0, 92.0, 67.0, 42.0, 35.0, 27.0, 24.0, 19.0, 16.0, 14.0, 11.0, 0.0, 4.0, 5.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.9375, -42.5146484375, -41.091796875, -39.6689453125, -38.24609375, -36.8232421875, -35.400390625, -33.9775390625, -32.5546875, -31.1318359375, -29.708984375, -28.2861328125, -26.86328125, -25.4404296875, -24.017578125, -22.5947265625, -21.171875, -19.7490234375, -18.326171875, -16.9033203125, -15.48046875, -14.0576171875, -12.634765625, -11.2119140625, -9.7890625, -8.3662109375, -6.943359375, -5.5205078125, -4.09765625, -2.6748046875, -1.251953125, 0.1708984375, 1.59375, 3.0166015625, 4.439453125, 5.8623046875, 7.28515625, 8.7080078125, 10.130859375, 11.5537109375, 12.9765625, 14.3994140625, 15.822265625, 17.2451171875, 18.66796875, 20.0908203125, 21.513671875, 22.9365234375, 24.359375, 25.7822265625, 27.205078125, 28.6279296875, 30.05078125, 31.4736328125, 32.896484375, 34.3193359375, 35.7421875, 37.1650390625, 38.587890625, 40.0107421875, 41.43359375, 42.8564453125, 44.279296875, 45.7021484375, 47.125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 5.0, 1.0, 7.0, 7.0, 6.0, 12.0, 9.0, 12.0, 21.0, 21.0, 15.0, 37.0, 38.0, 78.0, 130.0, 284.0, 641.0, 1100.0, 812.0, 375.0, 151.0, 96.0, 39.0, 38.0, 19.0, 22.0, 19.0, 21.0, 15.0, 15.0, 4.0, 10.0, 1.0, 4.0, 4.0, 3.0, 6.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.390625, -24.438720703125, -23.48681640625, -22.534912109375, -21.5830078125, -20.631103515625, -19.67919921875, -18.727294921875, -17.775390625, -16.823486328125, -15.87158203125, -14.919677734375, -13.9677734375, -13.015869140625, -12.06396484375, -11.112060546875, -10.16015625, -9.208251953125, -8.25634765625, -7.304443359375, -6.3525390625, -5.400634765625, -4.44873046875, -3.496826171875, -2.544921875, -1.593017578125, -0.64111328125, 0.310791015625, 1.2626953125, 2.214599609375, 3.16650390625, 4.118408203125, 5.0703125, 6.022216796875, 6.97412109375, 7.926025390625, 8.8779296875, 9.829833984375, 10.78173828125, 11.733642578125, 12.685546875, 13.637451171875, 14.58935546875, 15.541259765625, 16.4931640625, 17.445068359375, 18.39697265625, 19.348876953125, 20.30078125, 21.252685546875, 22.20458984375, 23.156494140625, 24.1083984375, 25.060302734375, 26.01220703125, 26.964111328125, 27.916015625, 28.867919921875, 29.81982421875, 30.771728515625, 31.7236328125, 32.675537109375, 33.62744140625, 34.579345703125, 35.53125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 3.0, 4.0, 6.0, 5.0, 15.0, 17.0, 28.0, 25.0, 63.0, 86.0, 125.0, 218.0, 438.0, 837.0, 1869.0, 4775.0, 14118.0, 52428.0, 1022673.0, 2992603.0, 75702.0, 17965.0, 5885.0, 2293.0, 985.0, 436.0, 263.0, 138.0, 101.0, 66.0, 31.0, 23.0, 17.0, 16.0, 5.0, 11.0, 6.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.40625, -40.841796875, -39.27734375, -37.712890625, -36.1484375, -34.583984375, -33.01953125, -31.455078125, -29.890625, -28.326171875, -26.76171875, -25.197265625, -23.6328125, -22.068359375, -20.50390625, -18.939453125, -17.375, -15.810546875, -14.24609375, -12.681640625, -11.1171875, -9.552734375, -7.98828125, -6.423828125, -4.859375, -3.294921875, -1.73046875, -0.166015625, 1.3984375, 2.962890625, 4.52734375, 6.091796875, 7.65625, 9.220703125, 10.78515625, 12.349609375, 13.9140625, 15.478515625, 17.04296875, 18.607421875, 20.171875, 21.736328125, 23.30078125, 24.865234375, 26.4296875, 27.994140625, 29.55859375, 31.123046875, 32.6875, 34.251953125, 35.81640625, 37.380859375, 38.9453125, 40.509765625, 42.07421875, 43.638671875, 45.203125, 46.767578125, 48.33203125, 49.896484375, 51.4609375, 53.025390625, 54.58984375, 56.154296875, 57.71875]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [3.0, 0.0, 5.0, 9.0, 16.0, 39.0, 99.0, 177.0, 309.0, 223.0, 68.0, 36.0, 16.0, 8.0, 7.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.44499206542969, -43.59242248535156, -37.73985290527344, -31.887279510498047, -26.034709930419922, -20.182140350341797, -14.329566955566406, -8.476997375488281, -2.6244277954101562, 3.228142738342285, 9.080713272094727, 14.933284759521484, 20.78585433959961, 26.638423919677734, 32.490997314453125, 38.34356689453125, 44.196136474609375, 50.0487060546875, 55.901275634765625, 61.753849029541016, 67.60641479492188, 73.458984375, 79.31156158447266, 85.16413116455078, 91.0167007446289, 96.86927032470703, 102.72183990478516, 108.57441711425781, 114.42698669433594, 120.27955627441406, 126.13212585449219, 131.9846954345703, 137.83724975585938, 143.6898193359375, 149.54238891601562, 155.39495849609375, 161.24752807617188, 167.10009765625, 172.95266723632812, 178.80523681640625, 184.65780639648438, 190.5103759765625, 196.36294555664062, 202.21551513671875, 208.06808471679688, 213.920654296875, 219.77322387695312, 225.62579345703125, 231.47837829589844, 237.33094787597656, 243.1835174560547, 249.0360870361328, 254.88865661621094, 260.7412414550781, 266.59381103515625, 272.4463806152344, 278.2989501953125, 284.1515197753906, 290.00408935546875, 295.8566589355469, 301.709228515625, 307.5617980957031, 313.41436767578125, 319.2669372558594, 325.1195068359375]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 4.0, 10.0, 6.0, 13.0, 14.0, 12.0, 14.0, 25.0, 20.0, 23.0, 21.0, 28.0, 28.0, 30.0, 32.0, 24.0, 30.0, 35.0, 37.0, 43.0, 38.0, 41.0, 39.0, 41.0, 41.0, 42.0, 41.0, 27.0, 37.0, 22.0, 27.0, 21.0, 27.0, 16.0, 17.0, 9.0, 11.0, 8.0, 5.0, 6.0, 7.0, 1.0, 8.0, 8.0, 5.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0], "bins": [-79.05381774902344, -76.65140533447266, -74.24899291992188, -71.84658813476562, -69.44417572021484, -67.04176330566406, -64.63935089111328, -62.2369384765625, -59.834529876708984, -57.4321174621582, -55.02970886230469, -52.627296447753906, -50.224884033203125, -47.82247543334961, -45.42006301879883, -43.01765441894531, -40.61524200439453, -38.21282958984375, -35.810420989990234, -33.40800857543945, -31.005598068237305, -28.603187561035156, -26.200775146484375, -23.798364639282227, -21.395954132080078, -18.99354362487793, -16.59113311767578, -14.188720703125, -11.786310195922852, -9.383899688720703, -6.981488227844238, -4.579076766967773, -2.176666259765625, 0.22574472427368164, 2.6281557083129883, 5.030566692352295, 7.432977676391602, 9.83538818359375, 12.237799644470215, 14.64021110534668, 17.042621612548828, 19.445032119750977, 21.847442626953125, 24.249855041503906, 26.652265548706055, 29.054676055908203, 31.457088470458984, 33.8594970703125, 36.26190948486328, 38.66432189941406, 41.06673049926758, 43.46914291381836, 45.871551513671875, 48.273963928222656, 50.67637634277344, 53.07878875732422, 55.481197357177734, 57.883609771728516, 60.28601837158203, 62.68843078613281, 65.0908432006836, 67.49325561523438, 69.89566040039062, 72.2980728149414, 74.70048522949219]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 2.0, 6.0, 5.0, 9.0, 7.0, 7.0, 15.0, 8.0, 10.0, 14.0, 17.0, 16.0, 24.0, 37.0, 29.0, 35.0, 38.0, 62.0, 50.0, 70.0, 66.0, 68.0, 62.0, 55.0, 40.0, 35.0, 26.0, 20.0, 23.0, 28.0, 20.0, 17.0, 14.0, 13.0, 5.0, 8.0, 7.0, 5.0, 7.0, 6.0, 3.0, 3.0, 6.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.65625, -8.3724365234375, -8.088623046875, -7.8048095703125, -7.52099609375, -7.2371826171875, -6.953369140625, -6.6695556640625, -6.3857421875, -6.1019287109375, -5.818115234375, -5.5343017578125, -5.25048828125, -4.9666748046875, -4.682861328125, -4.3990478515625, -4.115234375, -3.8314208984375, -3.547607421875, -3.2637939453125, -2.97998046875, -2.6961669921875, -2.412353515625, -2.1285400390625, -1.8447265625, -1.5609130859375, -1.277099609375, -0.9932861328125, -0.70947265625, -0.4256591796875, -0.141845703125, 0.1419677734375, 0.42578125, 0.7095947265625, 0.993408203125, 1.2772216796875, 1.56103515625, 1.8448486328125, 2.128662109375, 2.4124755859375, 2.6962890625, 2.9801025390625, 3.263916015625, 3.5477294921875, 3.83154296875, 4.1153564453125, 4.399169921875, 4.6829833984375, 4.966796875, 5.2506103515625, 5.534423828125, 5.8182373046875, 6.10205078125, 6.3858642578125, 6.669677734375, 6.9534912109375, 7.2373046875, 7.5211181640625, 7.804931640625, 8.0887451171875, 8.37255859375, 8.6563720703125, 8.940185546875, 9.2239990234375, 9.5078125]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 7.0, 13.0, 16.0, 21.0, 29.0, 42.0, 58.0, 92.0, 140.0, 198.0, 291.0, 383.0, 602.0, 903.0, 1415.0, 2069.0, 3244.0, 5069.0, 7863.0, 12682.0, 20447.0, 33906.0, 58124.0, 105139.0, 200613.0, 265556.0, 140401.0, 76671.0, 43141.0, 25716.0, 15952.0, 9848.0, 6182.0, 4023.0, 2674.0, 1643.0, 1087.0, 731.0, 520.0, 318.0, 222.0, 157.0, 115.0, 79.0, 51.0, 30.0, 30.0, 20.0, 8.0, 5.0, 8.0, 1.0, 7.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1685791015625, -0.16334915161132812, -0.15811920166015625, -0.15288925170898438, -0.1476593017578125, -0.14242935180664062, -0.13719940185546875, -0.13196945190429688, -0.126739501953125, -0.12150955200195312, -0.11627960205078125, -0.11104965209960938, -0.1058197021484375, -0.10058975219726562, -0.09535980224609375, -0.09012985229492188, -0.08489990234375, -0.07966995239257812, -0.07444000244140625, -0.06921005249023438, -0.0639801025390625, -0.058750152587890625, -0.05352020263671875, -0.048290252685546875, -0.043060302734375, -0.037830352783203125, -0.03260040283203125, -0.027370452880859375, -0.0221405029296875, -0.016910552978515625, -0.01168060302734375, -0.006450653076171875, -0.001220703125, 0.004009246826171875, 0.00923919677734375, 0.014469146728515625, 0.0196990966796875, 0.024929046630859375, 0.03015899658203125, 0.035388946533203125, 0.040618896484375, 0.045848846435546875, 0.05107879638671875, 0.056308746337890625, 0.0615386962890625, 0.06676864624023438, 0.07199859619140625, 0.07722854614257812, 0.08245849609375, 0.08768844604492188, 0.09291839599609375, 0.09814834594726562, 0.1033782958984375, 0.10860824584960938, 0.11383819580078125, 0.11906814575195312, 0.124298095703125, 0.12952804565429688, 0.13475799560546875, 0.13998794555664062, 0.1452178955078125, 0.15044784545898438, 0.15567779541015625, 0.16090774536132812, 0.1661376953125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 5.0, 7.0, 7.0, 6.0, 7.0, 6.0, 9.0, 11.0, 19.0, 19.0, 22.0, 18.0, 27.0, 32.0, 27.0, 42.0, 32.0, 32.0, 48.0, 47.0, 41.0, 1066.0, 52.0, 50.0, 41.0, 48.0, 34.0, 41.0, 33.0, 25.0, 28.0, 29.0, 22.0, 14.0, 14.0, 9.0, 12.0, 8.0, 12.0, 8.0, 6.0, 5.0, 4.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.63671875, -4.50140380859375, -4.3660888671875, -4.23077392578125, -4.095458984375, -3.96014404296875, -3.8248291015625, -3.68951416015625, -3.55419921875, -3.41888427734375, -3.2835693359375, -3.14825439453125, -3.012939453125, -2.87762451171875, -2.7423095703125, -2.60699462890625, -2.4716796875, -2.33636474609375, -2.2010498046875, -2.06573486328125, -1.930419921875, -1.79510498046875, -1.6597900390625, -1.52447509765625, -1.38916015625, -1.25384521484375, -1.1185302734375, -0.98321533203125, -0.847900390625, -0.71258544921875, -0.5772705078125, -0.44195556640625, -0.306640625, -0.17132568359375, -0.0360107421875, 0.09930419921875, 0.234619140625, 0.36993408203125, 0.5052490234375, 0.64056396484375, 0.77587890625, 0.91119384765625, 1.0465087890625, 1.18182373046875, 1.317138671875, 1.45245361328125, 1.5877685546875, 1.72308349609375, 1.8583984375, 1.99371337890625, 2.1290283203125, 2.26434326171875, 2.399658203125, 2.53497314453125, 2.6702880859375, 2.80560302734375, 2.94091796875, 3.07623291015625, 3.2115478515625, 3.34686279296875, 3.482177734375, 3.61749267578125, 3.7528076171875, 3.88812255859375, 4.0234375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 7.0, 2.0, 7.0, 9.0, 12.0, 19.0, 30.0, 31.0, 67.0, 93.0, 134.0, 203.0, 246.0, 413.0, 540.0, 826.0, 1162.0, 1765.0, 2486.0, 3837.0, 5561.0, 8392.0, 12643.0, 18930.0, 28477.0, 43976.0, 66942.0, 106046.0, 169602.0, 1250352.0, 132505.0, 83545.0, 53693.0, 35029.0, 23111.0, 15461.0, 10020.0, 6748.0, 4483.0, 3084.0, 2017.0, 1439.0, 972.0, 729.0, 440.0, 329.0, 207.0, 162.0, 119.0, 81.0, 59.0, 44.0, 26.0, 9.0, 9.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.0650634765625, -0.06304550170898438, -0.06102752685546875, -0.059009552001953125, -0.0569915771484375, -0.054973602294921875, -0.05295562744140625, -0.050937652587890625, -0.048919677734375, -0.046901702880859375, -0.04488372802734375, -0.042865753173828125, -0.0408477783203125, -0.038829803466796875, -0.03681182861328125, -0.034793853759765625, -0.03277587890625, -0.030757904052734375, -0.02873992919921875, -0.026721954345703125, -0.0247039794921875, -0.022686004638671875, -0.02066802978515625, -0.018650054931640625, -0.016632080078125, -0.014614105224609375, -0.01259613037109375, -0.010578155517578125, -0.0085601806640625, -0.006542205810546875, -0.00452423095703125, -0.002506256103515625, -0.00048828125, 0.001529693603515625, 0.00354766845703125, 0.005565643310546875, 0.0075836181640625, 0.009601593017578125, 0.01161956787109375, 0.013637542724609375, 0.015655517578125, 0.017673492431640625, 0.01969146728515625, 0.021709442138671875, 0.0237274169921875, 0.025745391845703125, 0.02776336669921875, 0.029781341552734375, 0.03179931640625, 0.033817291259765625, 0.03583526611328125, 0.037853240966796875, 0.0398712158203125, 0.041889190673828125, 0.04390716552734375, 0.045925140380859375, 0.047943115234375, 0.049961090087890625, 0.05197906494140625, 0.053997039794921875, 0.0560150146484375, 0.058032989501953125, 0.06005096435546875, 0.062068939208984375, 0.0640869140625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 0.0, 0.0, 3.0, 3.0, 7.0, 6.0, 4.0, 7.0, 7.0, 6.0, 12.0, 21.0, 18.0, 20.0, 26.0, 31.0, 38.0, 45.0, 62.0, 70.0, 74.0, 67.0, 77.0, 61.0, 60.0, 40.0, 50.0, 37.0, 30.0, 16.0, 25.0, 19.0, 17.0, 14.0, 5.0, 4.0, 7.0, 7.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.00015294551849365234, -0.00014812685549259186, -0.00014330819249153137, -0.00013848952949047089, -0.0001336708664894104, -0.00012885220348834991, -0.00012403354048728943, -0.00011921487748622894, -0.00011439621448516846, -0.00010957755148410797, -0.00010475888848304749, -9.9940225481987e-05, -9.512156248092651e-05, -9.030289947986603e-05, -8.548423647880554e-05, -8.066557347774506e-05, -7.584691047668457e-05, -7.102824747562408e-05, -6.62095844745636e-05, -6.139092147350311e-05, -5.657225847244263e-05, -5.175359547138214e-05, -4.6934932470321655e-05, -4.211626946926117e-05, -3.7297606468200684e-05, -3.24789434671402e-05, -2.7660280466079712e-05, -2.2841617465019226e-05, -1.802295446395874e-05, -1.3204291462898254e-05, -8.385628461837769e-06, -3.5669654607772827e-06, 1.2516975402832031e-06, 6.070360541343689e-06, 1.0889023542404175e-05, 1.570768654346466e-05, 2.0526349544525146e-05, 2.5345012545585632e-05, 3.0163675546646118e-05, 3.4982338547706604e-05, 3.980100154876709e-05, 4.4619664549827576e-05, 4.943832755088806e-05, 5.425699055194855e-05, 5.907565355300903e-05, 6.389431655406952e-05, 6.871297955513e-05, 7.353164255619049e-05, 7.835030555725098e-05, 8.316896855831146e-05, 8.798763155937195e-05, 9.280629456043243e-05, 9.762495756149292e-05, 0.0001024436205625534, 0.00010726228356361389, 0.00011208094656467438, 0.00011689960956573486, 0.00012171827256679535, 0.00012653693556785583, 0.00013135559856891632, 0.0001361742615699768, 0.0001409929245710373, 0.00014581158757209778, 0.00015063025057315826, 0.00015544891357421875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 2.0, 3.0, 11.0, 7.0, 13.0, 19.0, 15.0, 26.0, 16.0, 33.0, 36.0, 61.0, 78.0, 90.0, 87.0, 134.0, 173.0, 224.0, 349.0, 1076.0, 35244.0, 999309.0, 9600.0, 678.0, 299.0, 199.0, 152.0, 135.0, 100.0, 72.0, 69.0, 58.0, 45.0, 22.0, 22.0, 19.0, 18.0, 20.0, 10.0, 7.0, 3.0, 5.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0], "bins": [-0.00244903564453125, -0.0023733675479888916, -0.002297699451446533, -0.002222031354904175, -0.0021463632583618164, -0.002070695161819458, -0.0019950270652770996, -0.0019193589687347412, -0.0018436908721923828, -0.0017680227756500244, -0.001692354679107666, -0.0016166865825653076, -0.0015410184860229492, -0.0014653503894805908, -0.0013896822929382324, -0.001314014196395874, -0.0012383460998535156, -0.0011626780033111572, -0.0010870099067687988, -0.0010113418102264404, -0.000935673713684082, -0.0008600056171417236, -0.0007843375205993652, -0.0007086694240570068, -0.0006330013275146484, -0.00055733323097229, -0.00048166513442993164, -0.00040599703788757324, -0.00033032894134521484, -0.00025466084480285645, -0.00017899274826049805, -0.00010332465171813965, -2.765655517578125e-05, 4.801154136657715e-05, 0.00012367963790893555, 0.00019934773445129395, 0.00027501583099365234, 0.00035068392753601074, 0.00042635202407836914, 0.0005020201206207275, 0.0005776882171630859, 0.0006533563137054443, 0.0007290244102478027, 0.0008046925067901611, 0.0008803606033325195, 0.0009560286998748779, 0.0010316967964172363, 0.0011073648929595947, 0.0011830329895019531, 0.0012587010860443115, 0.00133436918258667, 0.0014100372791290283, 0.0014857053756713867, 0.0015613734722137451, 0.0016370415687561035, 0.001712709665298462, 0.0017883777618408203, 0.0018640458583831787, 0.0019397139549255371, 0.0020153820514678955, 0.002091050148010254, 0.0021667182445526123, 0.0022423863410949707, 0.002318054437637329, 0.0023937225341796875]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 9.0, 21.0, 82.0, 391.0, 362.0, 85.0, 37.0, 12.0, 4.0, 1.0, 1.0, 2.0], "bins": [-0.0005354912136681378, -0.0005259194294922054, -0.0005163475871086121, -0.0005067758029326797, -0.0004972039605490863, -0.00048763214726932347, -0.0004780603339895606, -0.00046848852070979774, -0.0004589167074300349, -0.000449344894150272, -0.00043977308087050915, -0.0004302012675907463, -0.0004206294543109834, -0.00041105764103122056, -0.0004014858277514577, -0.0003919140144716948, -0.00038234220119193196, -0.0003727703879121691, -0.00036319857463240623, -0.00035362676135264337, -0.0003440549480728805, -0.00033448313479311764, -0.0003249113215133548, -0.0003153395082335919, -0.0003057677240576595, -0.00029619591077789664, -0.0002866240974981338, -0.0002770522842183709, -0.00026748047093860805, -0.0002579086576588452, -0.0002483368443790823, -0.00023876503109931946, -0.00022919323237147182, -0.00021962141909170896, -0.0002100496058119461, -0.00020047779253218323, -0.00019090597925242037, -0.0001813341659726575, -0.00017176236724480987, -0.000162190553965047, -0.00015261874068528414, -0.00014304692740552127, -0.0001334751141257584, -0.00012390330084599555, -0.00011433148756623268, -0.00010475967428646982, -9.518786828266457e-05, -8.56160550029017e-05, -7.604423444718122e-05, -6.647242116741836e-05, -5.6900607887655497e-05, -4.732879824587144e-05, -3.7756984966108575e-05, -2.818517168634571e-05, -1.8613362044561654e-05, -9.04154876479879e-06, 5.302645149640739e-07, 1.0102076885232236e-05, 1.96738892555004e-05, 2.924570071627386e-05, 3.881751399603672e-05, 4.838932727579959e-05, 5.7961136917583644e-05, 6.753295019734651e-05, 7.710476347710937e-05]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 4.0, 8.0, 10.0, 10.0, 9.0, 10.0, 15.0, 23.0, 27.0, 28.0, 28.0, 27.0, 29.0, 36.0, 51.0, 48.0, 29.0, 51.0, 43.0, 48.0, 43.0, 39.0, 41.0, 41.0, 28.0, 34.0, 32.0, 22.0, 35.0, 31.0, 24.0, 10.0, 14.0, 11.0, 8.0, 13.0, 11.0, 4.0, 6.0, 6.0, 8.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.738040924072266e-05, -8.438806980848312e-05, -8.139573037624359e-05, -7.840339094400406e-05, -7.541105151176453e-05, -7.2418712079525e-05, -6.942637264728546e-05, -6.643403321504593e-05, -6.34416937828064e-05, -6.0449354350566864e-05, -5.745701491832733e-05, -5.44646754860878e-05, -5.1472336053848267e-05, -4.8479996621608734e-05, -4.54876571893692e-05, -4.249531775712967e-05, -3.950297832489014e-05, -3.6510638892650604e-05, -3.351829946041107e-05, -3.052596002817154e-05, -2.7533620595932007e-05, -2.4541281163692474e-05, -2.1548941731452942e-05, -1.855660229921341e-05, -1.5564262866973877e-05, -1.2571923434734344e-05, -9.579584002494812e-06, -6.5872445702552795e-06, -3.594905138015747e-06, -6.025657057762146e-07, 2.389773726463318e-06, 5.38211315870285e-06, 8.374452590942383e-06, 1.1366792023181915e-05, 1.4359131455421448e-05, 1.735147088766098e-05, 2.0343810319900513e-05, 2.3336149752140045e-05, 2.6328489184379578e-05, 2.932082861661911e-05, 3.231316804885864e-05, 3.5305507481098175e-05, 3.829784691333771e-05, 4.129018634557724e-05, 4.428252577781677e-05, 4.7274865210056305e-05, 5.026720464229584e-05, 5.325954407453537e-05, 5.62518835067749e-05, 5.9244222939014435e-05, 6.223656237125397e-05, 6.52289018034935e-05, 6.822124123573303e-05, 7.121358066797256e-05, 7.42059201002121e-05, 7.719825953245163e-05, 8.019059896469116e-05, 8.31829383969307e-05, 8.617527782917023e-05, 8.916761726140976e-05, 9.215995669364929e-05, 9.515229612588882e-05, 9.814463555812836e-05, 0.00010113697499036789, 0.00010412931442260742]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 2.0, 6.0, 5.0, 9.0, 7.0, 7.0, 15.0, 8.0, 10.0, 14.0, 17.0, 16.0, 24.0, 37.0, 29.0, 35.0, 38.0, 62.0, 50.0, 70.0, 66.0, 68.0, 62.0, 55.0, 40.0, 35.0, 26.0, 20.0, 23.0, 28.0, 20.0, 17.0, 14.0, 13.0, 5.0, 8.0, 7.0, 5.0, 7.0, 6.0, 3.0, 3.0, 6.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.65625, -8.3724365234375, -8.088623046875, -7.8048095703125, -7.52099609375, -7.2371826171875, -6.953369140625, -6.6695556640625, -6.3857421875, -6.1019287109375, -5.818115234375, -5.5343017578125, -5.25048828125, -4.9666748046875, -4.682861328125, -4.3990478515625, -4.115234375, -3.8314208984375, -3.547607421875, -3.2637939453125, -2.97998046875, -2.6961669921875, -2.412353515625, -2.1285400390625, -1.8447265625, -1.5609130859375, -1.277099609375, -0.9932861328125, -0.70947265625, -0.4256591796875, -0.141845703125, 0.1419677734375, 0.42578125, 0.7095947265625, 0.993408203125, 1.2772216796875, 1.56103515625, 1.8448486328125, 2.128662109375, 2.4124755859375, 2.6962890625, 2.9801025390625, 3.263916015625, 3.5477294921875, 3.83154296875, 4.1153564453125, 4.399169921875, 4.6829833984375, 4.966796875, 5.2506103515625, 5.534423828125, 5.8182373046875, 6.10205078125, 6.3858642578125, 6.669677734375, 6.9534912109375, 7.2373046875, 7.5211181640625, 7.804931640625, 8.0887451171875, 8.37255859375, 8.6563720703125, 8.940185546875, 9.2239990234375, 9.5078125]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 4.0, 2.0, 7.0, 3.0, 6.0, 9.0, 10.0, 21.0, 26.0, 39.0, 47.0, 93.0, 111.0, 172.0, 251.0, 364.0, 525.0, 771.0, 1273.0, 2559.0, 7108.0, 52627.0, 909271.0, 59406.0, 7361.0, 2642.0, 1369.0, 805.0, 507.0, 371.0, 247.0, 172.0, 117.0, 88.0, 47.0, 50.0, 17.0, 16.0, 14.0, 11.0, 5.0, 2.0, 7.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.453125, -19.782958984375, -19.11279296875, -18.442626953125, -17.7724609375, -17.102294921875, -16.43212890625, -15.761962890625, -15.091796875, -14.421630859375, -13.75146484375, -13.081298828125, -12.4111328125, -11.740966796875, -11.07080078125, -10.400634765625, -9.73046875, -9.060302734375, -8.39013671875, -7.719970703125, -7.0498046875, -6.379638671875, -5.70947265625, -5.039306640625, -4.369140625, -3.698974609375, -3.02880859375, -2.358642578125, -1.6884765625, -1.018310546875, -0.34814453125, 0.322021484375, 0.9921875, 1.662353515625, 2.33251953125, 3.002685546875, 3.6728515625, 4.343017578125, 5.01318359375, 5.683349609375, 6.353515625, 7.023681640625, 7.69384765625, 8.364013671875, 9.0341796875, 9.704345703125, 10.37451171875, 11.044677734375, 11.71484375, 12.385009765625, 13.05517578125, 13.725341796875, 14.3955078125, 15.065673828125, 15.73583984375, 16.406005859375, 17.076171875, 17.746337890625, 18.41650390625, 19.086669921875, 19.7568359375, 20.427001953125, 21.09716796875, 21.767333984375, 22.4375]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 0.0, 2.0, 2.0, 4.0, 7.0, 7.0, 6.0, 9.0, 11.0, 15.0, 14.0, 18.0, 33.0, 27.0, 29.0, 31.0, 40.0, 35.0, 34.0, 45.0, 60.0, 106.0, 1716.0, 268.0, 85.0, 54.0, 44.0, 54.0, 35.0, 42.0, 28.0, 28.0, 30.0, 20.0, 15.0, 14.0, 15.0, 20.0, 12.0, 9.0, 4.0, 7.0, 4.0, 0.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-30.640625, -29.706298828125, -28.77197265625, -27.837646484375, -26.9033203125, -25.968994140625, -25.03466796875, -24.100341796875, -23.166015625, -22.231689453125, -21.29736328125, -20.363037109375, -19.4287109375, -18.494384765625, -17.56005859375, -16.625732421875, -15.69140625, -14.757080078125, -13.82275390625, -12.888427734375, -11.9541015625, -11.019775390625, -10.08544921875, -9.151123046875, -8.216796875, -7.282470703125, -6.34814453125, -5.413818359375, -4.4794921875, -3.545166015625, -2.61083984375, -1.676513671875, -0.7421875, 0.192138671875, 1.12646484375, 2.060791015625, 2.9951171875, 3.929443359375, 4.86376953125, 5.798095703125, 6.732421875, 7.666748046875, 8.60107421875, 9.535400390625, 10.4697265625, 11.404052734375, 12.33837890625, 13.272705078125, 14.20703125, 15.141357421875, 16.07568359375, 17.010009765625, 17.9443359375, 18.878662109375, 19.81298828125, 20.747314453125, 21.681640625, 22.615966796875, 23.55029296875, 24.484619140625, 25.4189453125, 26.353271484375, 27.28759765625, 28.221923828125, 29.15625]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 1.0, 2.0, 3.0, 4.0, 6.0, 8.0, 7.0, 17.0, 11.0, 18.0, 20.0, 21.0, 29.0, 27.0, 51.0, 71.0, 117.0, 219.0, 434.0, 974.0, 2438.0, 10508.0, 2923485.0, 198011.0, 5825.0, 1736.0, 754.0, 343.0, 178.0, 102.0, 67.0, 51.0, 49.0, 24.0, 23.0, 16.0, 15.0, 11.0, 6.0, 6.0, 7.0, 4.0, 3.0, 2.0, 2.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-47.5625, -46.02001953125, -44.4775390625, -42.93505859375, -41.392578125, -39.85009765625, -38.3076171875, -36.76513671875, -35.22265625, -33.68017578125, -32.1376953125, -30.59521484375, -29.052734375, -27.51025390625, -25.9677734375, -24.42529296875, -22.8828125, -21.34033203125, -19.7978515625, -18.25537109375, -16.712890625, -15.17041015625, -13.6279296875, -12.08544921875, -10.54296875, -9.00048828125, -7.4580078125, -5.91552734375, -4.373046875, -2.83056640625, -1.2880859375, 0.25439453125, 1.796875, 3.33935546875, 4.8818359375, 6.42431640625, 7.966796875, 9.50927734375, 11.0517578125, 12.59423828125, 14.13671875, 15.67919921875, 17.2216796875, 18.76416015625, 20.306640625, 21.84912109375, 23.3916015625, 24.93408203125, 26.4765625, 28.01904296875, 29.5615234375, 31.10400390625, 32.646484375, 34.18896484375, 35.7314453125, 37.27392578125, 38.81640625, 40.35888671875, 41.9013671875, 43.44384765625, 44.986328125, 46.52880859375, 48.0712890625, 49.61376953125, 51.15625]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 10.0, 54.0, 385.0, 496.0, 61.0, 11.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.58192443847656, -109.81767272949219, -104.05342864990234, -98.28917694091797, -92.52493286132812, -86.76068115234375, -80.99642944335938, -75.23218536376953, -69.46794128417969, -63.70369338989258, -57.93944549560547, -52.175193786621094, -46.41094970703125, -40.646697998046875, -34.882450103759766, -29.118202209472656, -23.35395050048828, -17.589702606201172, -11.825453758239746, -6.06120491027832, -0.29695701599121094, 5.467290878295898, 11.23154067993164, 16.99578857421875, 22.76003646850586, 28.52428436279297, 34.28853225708008, 40.05278015136719, 45.81703186035156, 51.581275939941406, 57.34552764892578, 63.10977554321289, 68.8740234375, 74.63827514648438, 80.40251922607422, 86.1667709350586, 91.93101501464844, 97.69526672363281, 103.45951843261719, 109.22376251220703, 114.98800659179688, 120.75225830078125, 126.5165023803711, 132.28074645996094, 138.0449981689453, 143.8092498779297, 149.57350158691406, 155.33773803710938, 161.10198974609375, 166.86624145507812, 172.6304931640625, 178.3947296142578, 184.1589813232422, 189.92323303222656, 195.68748474121094, 201.45172119140625, 207.2159881591797, 212.98023986816406, 218.74449157714844, 224.50872802734375, 230.27297973632812, 236.0372314453125, 241.80148315429688, 247.56573486328125, 253.32997131347656]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 10.0, 7.0, 12.0, 13.0, 18.0, 26.0, 24.0, 21.0, 21.0, 22.0, 33.0, 31.0, 40.0, 42.0, 39.0, 34.0, 42.0, 52.0, 55.0, 36.0, 46.0, 33.0, 43.0, 33.0, 38.0, 35.0, 31.0, 28.0, 23.0, 25.0, 16.0, 6.0, 18.0, 8.0, 5.0, 9.0, 7.0, 4.0, 4.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-103.51428985595703, -100.1222915649414, -96.73029327392578, -93.33828735351562, -89.9462890625, -86.55429077148438, -83.16229248046875, -79.77029418945312, -76.3782958984375, -72.98629760742188, -69.59429931640625, -66.20230102539062, -62.81029510498047, -59.418296813964844, -56.02629852294922, -52.634300231933594, -49.24229431152344, -45.85029602050781, -42.45829391479492, -39.0662956237793, -35.674293518066406, -32.28229522705078, -28.890296936035156, -25.4982967376709, -22.10629653930664, -18.714296340942383, -15.322297096252441, -11.9302978515625, -8.538297653198242, -5.146297454833984, -1.7542991638183594, 1.6377010345458984, 5.029701232910156, 8.421701431274414, 11.813700675964355, 15.205699920654297, 18.597700119018555, 21.989700317382812, 25.381698608398438, 28.773698806762695, 32.16569900512695, 35.55769729614258, 38.94969940185547, 42.341697692871094, 45.73369598388672, 49.12569808959961, 52.517696380615234, 55.909698486328125, 59.30169677734375, 62.693695068359375, 66.085693359375, 69.47769165039062, 72.86969757080078, 76.2616958618164, 79.65369415283203, 83.04569244384766, 86.43769836425781, 89.82969665527344, 93.22169494628906, 96.61369323730469, 100.00569915771484, 103.39769744873047, 106.7896957397461, 110.18169403076172, 113.57369232177734]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 2.0, 7.0, 4.0, 4.0, 7.0, 13.0, 8.0, 10.0, 14.0, 10.0, 17.0, 24.0, 22.0, 22.0, 41.0, 37.0, 46.0, 57.0, 54.0, 63.0, 71.0, 58.0, 64.0, 57.0, 42.0, 31.0, 32.0, 21.0, 29.0, 22.0, 17.0, 20.0, 11.0, 13.0, 9.0, 6.0, 4.0, 5.0, 7.0, 8.0, 2.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.921875, -8.62890625, -8.3359375, -8.04296875, -7.75, -7.45703125, -7.1640625, -6.87109375, -6.578125, -6.28515625, -5.9921875, -5.69921875, -5.40625, -5.11328125, -4.8203125, -4.52734375, -4.234375, -3.94140625, -3.6484375, -3.35546875, -3.0625, -2.76953125, -2.4765625, -2.18359375, -1.890625, -1.59765625, -1.3046875, -1.01171875, -0.71875, -0.42578125, -0.1328125, 0.16015625, 0.453125, 0.74609375, 1.0390625, 1.33203125, 1.625, 1.91796875, 2.2109375, 2.50390625, 2.796875, 3.08984375, 3.3828125, 3.67578125, 3.96875, 4.26171875, 4.5546875, 4.84765625, 5.140625, 5.43359375, 5.7265625, 6.01953125, 6.3125, 6.60546875, 6.8984375, 7.19140625, 7.484375, 7.77734375, 8.0703125, 8.36328125, 8.65625, 8.94921875, 9.2421875, 9.53515625, 9.828125]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 7.0, 12.0, 6.0, 11.0, 22.0, 38.0, 41.0, 51.0, 74.0, 99.0, 162.0, 273.0, 332.0, 539.0, 841.0, 1310.0, 2376.0, 4371.0, 8819.0, 27489.0, 698260.0, 3317458.0, 104353.0, 13454.0, 5952.0, 3182.0, 1726.0, 1023.0, 659.0, 439.0, 286.0, 172.0, 140.0, 89.0, 59.0, 39.0, 29.0, 25.0, 16.0, 12.0, 10.0, 7.0, 5.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.234375, -30.201416015625, -29.16845703125, -28.135498046875, -27.1025390625, -26.069580078125, -25.03662109375, -24.003662109375, -22.970703125, -21.937744140625, -20.90478515625, -19.871826171875, -18.8388671875, -17.805908203125, -16.77294921875, -15.739990234375, -14.70703125, -13.674072265625, -12.64111328125, -11.608154296875, -10.5751953125, -9.542236328125, -8.50927734375, -7.476318359375, -6.443359375, -5.410400390625, -4.37744140625, -3.344482421875, -2.3115234375, -1.278564453125, -0.24560546875, 0.787353515625, 1.8203125, 2.853271484375, 3.88623046875, 4.919189453125, 5.9521484375, 6.985107421875, 8.01806640625, 9.051025390625, 10.083984375, 11.116943359375, 12.14990234375, 13.182861328125, 14.2158203125, 15.248779296875, 16.28173828125, 17.314697265625, 18.34765625, 19.380615234375, 20.41357421875, 21.446533203125, 22.4794921875, 23.512451171875, 24.54541015625, 25.578369140625, 26.611328125, 27.644287109375, 28.67724609375, 29.710205078125, 30.7431640625, 31.776123046875, 32.80908203125, 33.842041015625, 34.875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 8.0, 11.0, 11.0, 21.0, 25.0, 42.0, 79.0, 156.0, 480.0, 1417.0, 1166.0, 349.0, 107.0, 55.0, 43.0, 29.0, 19.0, 15.0, 16.0, 7.0, 3.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.0625, -33.654296875, -32.24609375, -30.837890625, -29.4296875, -28.021484375, -26.61328125, -25.205078125, -23.796875, -22.388671875, -20.98046875, -19.572265625, -18.1640625, -16.755859375, -15.34765625, -13.939453125, -12.53125, -11.123046875, -9.71484375, -8.306640625, -6.8984375, -5.490234375, -4.08203125, -2.673828125, -1.265625, 0.142578125, 1.55078125, 2.958984375, 4.3671875, 5.775390625, 7.18359375, 8.591796875, 10.0, 11.408203125, 12.81640625, 14.224609375, 15.6328125, 17.041015625, 18.44921875, 19.857421875, 21.265625, 22.673828125, 24.08203125, 25.490234375, 26.8984375, 28.306640625, 29.71484375, 31.123046875, 32.53125, 33.939453125, 35.34765625, 36.755859375, 38.1640625, 39.572265625, 40.98046875, 42.388671875, 43.796875, 45.205078125, 46.61328125, 48.021484375, 49.4296875, 50.837890625, 52.24609375, 53.654296875, 55.0625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 4.0, 8.0, 15.0, 15.0, 33.0, 61.0, 90.0, 160.0, 396.0, 1100.0, 4279.0, 29231.0, 3601926.0, 536361.0, 16346.0, 2785.0, 837.0, 300.0, 136.0, 94.0, 48.0, 18.0, 17.0, 4.0, 8.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-105.3125, -102.4560546875, -99.599609375, -96.7431640625, -93.88671875, -91.0302734375, -88.173828125, -85.3173828125, -82.4609375, -79.6044921875, -76.748046875, -73.8916015625, -71.03515625, -68.1787109375, -65.322265625, -62.4658203125, -59.609375, -56.7529296875, -53.896484375, -51.0400390625, -48.18359375, -45.3271484375, -42.470703125, -39.6142578125, -36.7578125, -33.9013671875, -31.044921875, -28.1884765625, -25.33203125, -22.4755859375, -19.619140625, -16.7626953125, -13.90625, -11.0498046875, -8.193359375, -5.3369140625, -2.48046875, 0.3759765625, 3.232421875, 6.0888671875, 8.9453125, 11.8017578125, 14.658203125, 17.5146484375, 20.37109375, 23.2275390625, 26.083984375, 28.9404296875, 31.796875, 34.6533203125, 37.509765625, 40.3662109375, 43.22265625, 46.0791015625, 48.935546875, 51.7919921875, 54.6484375, 57.5048828125, 60.361328125, 63.2177734375, 66.07421875, 68.9306640625, 71.787109375, 74.6435546875, 77.5]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 12.0, 67.0, 384.0, 447.0, 76.0, 26.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-348.3537902832031, -335.4908447265625, -322.6278991699219, -309.76495361328125, -296.9020080566406, -284.0390625, -271.1761474609375, -258.31317138671875, -245.4502410888672, -232.58729553222656, -219.72434997558594, -206.86141967773438, -193.99847412109375, -181.13552856445312, -168.2725830078125, -155.40963745117188, -142.54669189453125, -129.68374633789062, -116.82080078125, -103.9578628540039, -91.09491729736328, -78.23197174072266, -65.36903381347656, -52.50608825683594, -39.64314270019531, -26.78019905090332, -13.917255401611328, -1.0543136596679688, 11.808631896972656, 24.67157745361328, 37.534515380859375, 50.3974609375, 63.260406494140625, 76.12335205078125, 88.98629760742188, 101.84923553466797, 114.7121810913086, 127.57512664794922, 140.4380645751953, 153.30101013183594, 166.16395568847656, 179.0269012451172, 191.8898468017578, 204.75277709960938, 217.61572265625, 230.47866821289062, 243.34161376953125, 256.2045593261719, 269.0675048828125, 281.9304504394531, 294.79339599609375, 307.6563415527344, 320.519287109375, 333.3822326660156, 346.24517822265625, 359.10809326171875, 371.9710693359375, 384.8340148925781, 397.69696044921875, 410.5599060058594, 423.4228515625, 436.2857971191406, 449.14874267578125, 462.01165771484375, 474.8746032714844]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 5.0, 10.0, 8.0, 7.0, 15.0, 11.0, 7.0, 18.0, 18.0, 14.0, 21.0, 30.0, 34.0, 24.0, 38.0, 40.0, 33.0, 21.0, 29.0, 41.0, 39.0, 35.0, 38.0, 44.0, 37.0, 37.0, 41.0, 29.0, 32.0, 27.0, 27.0, 35.0, 18.0, 20.0, 21.0, 14.0, 14.0, 14.0, 13.0, 10.0, 6.0, 9.0, 6.0, 3.0, 1.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-78.59513092041016, -76.32500457763672, -74.05488586425781, -71.78475952148438, -69.51463317871094, -67.2445068359375, -64.9743881225586, -62.704261779785156, -60.434139251708984, -58.16401672363281, -55.893890380859375, -53.6237678527832, -51.35364532470703, -49.083518981933594, -46.81339645385742, -44.54327392578125, -42.27314758300781, -40.00302505493164, -37.7328987121582, -35.46277618408203, -33.192649841308594, -30.922527313232422, -28.65240478515625, -26.382280349731445, -24.11215591430664, -21.842031478881836, -19.57190704345703, -17.30178451538086, -15.031660079956055, -12.76153564453125, -10.491412162780762, -8.221288681030273, -5.9511566162109375, -3.681032657623291, -1.4109086990356445, 0.859215259552002, 3.1293392181396484, 5.399463653564453, 7.669587135314941, 9.93971061706543, 12.209835052490234, 14.479959487915039, 16.750083923339844, 19.020206451416016, 21.29033088684082, 23.560455322265625, 25.830577850341797, 28.1007022857666, 30.370826721191406, 32.64094924926758, 34.911075592041016, 37.18119812011719, 39.451324462890625, 41.7214469909668, 43.99156951904297, 46.261695861816406, 48.53181838989258, 50.80194091796875, 53.07206726074219, 55.34218978881836, 57.61231231689453, 59.88243865966797, 62.15256118774414, 64.42268371582031, 66.69281005859375]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 3.0, 2.0, 4.0, 6.0, 10.0, 11.0, 6.0, 14.0, 14.0, 12.0, 16.0, 26.0, 34.0, 21.0, 30.0, 45.0, 49.0, 44.0, 65.0, 53.0, 69.0, 48.0, 54.0, 55.0, 35.0, 41.0, 33.0, 39.0, 25.0, 18.0, 15.0, 18.0, 18.0, 9.0, 14.0, 10.0, 8.0, 4.0, 4.0, 2.0, 7.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.0859375, -8.8060302734375, -8.526123046875, -8.2462158203125, -7.96630859375, -7.6864013671875, -7.406494140625, -7.1265869140625, -6.8466796875, -6.5667724609375, -6.286865234375, -6.0069580078125, -5.72705078125, -5.4471435546875, -5.167236328125, -4.8873291015625, -4.607421875, -4.3275146484375, -4.047607421875, -3.7677001953125, -3.48779296875, -3.2078857421875, -2.927978515625, -2.6480712890625, -2.3681640625, -2.0882568359375, -1.808349609375, -1.5284423828125, -1.24853515625, -0.9686279296875, -0.688720703125, -0.4088134765625, -0.12890625, 0.1510009765625, 0.430908203125, 0.7108154296875, 0.99072265625, 1.2706298828125, 1.550537109375, 1.8304443359375, 2.1103515625, 2.3902587890625, 2.670166015625, 2.9500732421875, 3.22998046875, 3.5098876953125, 3.789794921875, 4.0697021484375, 4.349609375, 4.6295166015625, 4.909423828125, 5.1893310546875, 5.46923828125, 5.7491455078125, 6.029052734375, 6.3089599609375, 6.5888671875, 6.8687744140625, 7.148681640625, 7.4285888671875, 7.70849609375, 7.9884033203125, 8.268310546875, 8.5482177734375, 8.828125]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 4.0, 7.0, 11.0, 23.0, 21.0, 42.0, 57.0, 54.0, 99.0, 119.0, 215.0, 306.0, 377.0, 536.0, 776.0, 1119.0, 1593.0, 2320.0, 3214.0, 4743.0, 7189.0, 10487.0, 16367.0, 25248.0, 40103.0, 64931.0, 107957.0, 178207.0, 218938.0, 138440.0, 83256.0, 50114.0, 31307.0, 19854.0, 13069.0, 8577.0, 5915.0, 3894.0, 2781.0, 1831.0, 1316.0, 948.0, 660.0, 451.0, 321.0, 230.0, 134.0, 113.0, 91.0, 71.0, 37.0, 29.0, 23.0, 17.0, 7.0, 8.0, 6.0, 3.0, 1.0, 2.0], "bins": [-0.147705078125, -0.14312362670898438, -0.13854217529296875, -0.13396072387695312, -0.1293792724609375, -0.12479782104492188, -0.12021636962890625, -0.11563491821289062, -0.111053466796875, -0.10647201538085938, -0.10189056396484375, -0.09730911254882812, -0.0927276611328125, -0.08814620971679688, -0.08356475830078125, -0.07898330688476562, -0.07440185546875, -0.06982040405273438, -0.06523895263671875, -0.060657501220703125, -0.0560760498046875, -0.051494598388671875, -0.04691314697265625, -0.042331695556640625, -0.037750244140625, -0.033168792724609375, -0.02858734130859375, -0.024005889892578125, -0.0194244384765625, -0.014842987060546875, -0.01026153564453125, -0.005680084228515625, -0.0010986328125, 0.003482818603515625, 0.00806427001953125, 0.012645721435546875, 0.0172271728515625, 0.021808624267578125, 0.02639007568359375, 0.030971527099609375, 0.035552978515625, 0.040134429931640625, 0.04471588134765625, 0.049297332763671875, 0.0538787841796875, 0.058460235595703125, 0.06304168701171875, 0.06762313842773438, 0.07220458984375, 0.07678604125976562, 0.08136749267578125, 0.08594894409179688, 0.0905303955078125, 0.09511184692382812, 0.09969329833984375, 0.10427474975585938, 0.108856201171875, 0.11343765258789062, 0.11801910400390625, 0.12260055541992188, 0.1271820068359375, 0.13176345825195312, 0.13634490966796875, 0.14092636108398438, 0.1455078125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 10.0, 6.0, 3.0, 8.0, 6.0, 13.0, 12.0, 12.0, 13.0, 17.0, 18.0, 22.0, 19.0, 22.0, 22.0, 33.0, 34.0, 40.0, 33.0, 40.0, 55.0, 43.0, 1060.0, 39.0, 32.0, 49.0, 35.0, 39.0, 34.0, 32.0, 31.0, 25.0, 18.0, 29.0, 15.0, 13.0, 17.0, 16.0, 11.0, 8.0, 12.0, 6.0, 6.0, 7.0, 7.0, 7.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.1640625, -4.03155517578125, -3.8990478515625, -3.76654052734375, -3.634033203125, -3.50152587890625, -3.3690185546875, -3.23651123046875, -3.10400390625, -2.97149658203125, -2.8389892578125, -2.70648193359375, -2.573974609375, -2.44146728515625, -2.3089599609375, -2.17645263671875, -2.0439453125, -1.91143798828125, -1.7789306640625, -1.64642333984375, -1.513916015625, -1.38140869140625, -1.2489013671875, -1.11639404296875, -0.98388671875, -0.85137939453125, -0.7188720703125, -0.58636474609375, -0.453857421875, -0.32135009765625, -0.1888427734375, -0.05633544921875, 0.076171875, 0.20867919921875, 0.3411865234375, 0.47369384765625, 0.606201171875, 0.73870849609375, 0.8712158203125, 1.00372314453125, 1.13623046875, 1.26873779296875, 1.4012451171875, 1.53375244140625, 1.666259765625, 1.79876708984375, 1.9312744140625, 2.06378173828125, 2.1962890625, 2.32879638671875, 2.4613037109375, 2.59381103515625, 2.726318359375, 2.85882568359375, 2.9913330078125, 3.12384033203125, 3.25634765625, 3.38885498046875, 3.5213623046875, 3.65386962890625, 3.786376953125, 3.91888427734375, 4.0513916015625, 4.18389892578125, 4.31640625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 6.0, 6.0, 20.0, 18.0, 28.0, 35.0, 75.0, 111.0, 142.0, 192.0, 304.0, 374.0, 552.0, 822.0, 1129.0, 1591.0, 2174.0, 3037.0, 4247.0, 5870.0, 8328.0, 11657.0, 16433.0, 22950.0, 32903.0, 46501.0, 67251.0, 98673.0, 143971.0, 1216559.0, 126525.0, 86144.0, 58743.0, 40545.0, 28828.0, 20181.0, 14312.0, 10166.0, 7416.0, 5186.0, 3760.0, 2686.0, 1893.0, 1375.0, 994.0, 678.0, 503.0, 376.0, 269.0, 170.0, 143.0, 96.0, 73.0, 42.0, 31.0, 16.0, 8.0, 13.0, 8.0, 3.0, 5.0], "bins": [-0.0596923828125, -0.0578455924987793, -0.055998802185058594, -0.05415201187133789, -0.05230522155761719, -0.050458431243896484, -0.04861164093017578, -0.04676485061645508, -0.044918060302734375, -0.04307126998901367, -0.04122447967529297, -0.039377689361572266, -0.03753089904785156, -0.03568410873413086, -0.033837318420410156, -0.03199052810668945, -0.03014373779296875, -0.028296947479248047, -0.026450157165527344, -0.02460336685180664, -0.022756576538085938, -0.020909786224365234, -0.01906299591064453, -0.017216205596923828, -0.015369415283203125, -0.013522624969482422, -0.011675834655761719, -0.009829044342041016, -0.007982254028320312, -0.006135463714599609, -0.004288673400878906, -0.002441883087158203, -0.0005950927734375, 0.0012516975402832031, 0.0030984878540039062, 0.004945278167724609, 0.0067920684814453125, 0.008638858795166016, 0.010485649108886719, 0.012332439422607422, 0.014179229736328125, 0.016026020050048828, 0.01787281036376953, 0.019719600677490234, 0.021566390991210938, 0.02341318130493164, 0.025259971618652344, 0.027106761932373047, 0.02895355224609375, 0.030800342559814453, 0.032647132873535156, 0.03449392318725586, 0.03634071350097656, 0.038187503814697266, 0.04003429412841797, 0.04188108444213867, 0.043727874755859375, 0.04557466506958008, 0.04742145538330078, 0.049268245697021484, 0.05111503601074219, 0.05296182632446289, 0.054808616638183594, 0.0566554069519043, 0.058502197265625]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 7.0, 6.0, 17.0, 28.0, 19.0, 28.0, 36.0, 53.0, 43.0, 69.0, 72.0, 76.0, 70.0, 77.0, 80.0, 51.0, 64.0, 52.0, 32.0, 28.0, 29.0, 14.0, 10.0, 14.0, 6.0, 6.0, 4.0, 1.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00027441978454589844, -0.00026644766330718994, -0.00025847554206848145, -0.00025050342082977295, -0.00024253129959106445, -0.00023455917835235596, -0.00022658705711364746, -0.00021861493587493896, -0.00021064281463623047, -0.00020267069339752197, -0.00019469857215881348, -0.00018672645092010498, -0.00017875432968139648, -0.000170782208442688, -0.0001628100872039795, -0.000154837965965271, -0.0001468658447265625, -0.000138893723487854, -0.0001309216022491455, -0.000122949481010437, -0.00011497735977172852, -0.00010700523853302002, -9.903311729431152e-05, -9.106099605560303e-05, -8.308887481689453e-05, -7.511675357818604e-05, -6.714463233947754e-05, -5.917251110076904e-05, -5.120038986206055e-05, -4.322826862335205e-05, -3.5256147384643555e-05, -2.728402614593506e-05, -1.9311904907226562e-05, -1.1339783668518066e-05, -3.3676624298095703e-06, 4.604458808898926e-06, 1.2576580047607422e-05, 2.0548701286315918e-05, 2.8520822525024414e-05, 3.649294376373291e-05, 4.4465065002441406e-05, 5.24371862411499e-05, 6.04093074798584e-05, 6.83814287185669e-05, 7.635354995727539e-05, 8.432567119598389e-05, 9.229779243469238e-05, 0.00010026991367340088, 0.00010824203491210938, 0.00011621415615081787, 0.00012418627738952637, 0.00013215839862823486, 0.00014013051986694336, 0.00014810264110565186, 0.00015607476234436035, 0.00016404688358306885, 0.00017201900482177734, 0.00017999112606048584, 0.00018796324729919434, 0.00019593536853790283, 0.00020390748977661133, 0.00021187961101531982, 0.00021985173225402832, 0.00022782385349273682, 0.0002357959747314453]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 7.0, 6.0, 4.0, 12.0, 19.0, 24.0, 33.0, 58.0, 70.0, 107.0, 131.0, 186.0, 252.0, 302.0, 746.0, 13932.0, 1024165.0, 6674.0, 629.0, 304.0, 258.0, 159.0, 126.0, 104.0, 69.0, 51.0, 41.0, 26.0, 17.0, 10.0, 11.0, 11.0, 1.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003814697265625, -0.0036893486976623535, -0.003564000129699707, -0.0034386515617370605, -0.003313302993774414, -0.0031879544258117676, -0.003062605857849121, -0.0029372572898864746, -0.002811908721923828, -0.0026865601539611816, -0.002561211585998535, -0.0024358630180358887, -0.002310514450073242, -0.0021851658821105957, -0.0020598173141479492, -0.0019344687461853027, -0.0018091201782226562, -0.0016837716102600098, -0.0015584230422973633, -0.0014330744743347168, -0.0013077259063720703, -0.0011823773384094238, -0.0010570287704467773, -0.0009316802024841309, -0.0008063316345214844, -0.0006809830665588379, -0.0005556344985961914, -0.0004302859306335449, -0.00030493736267089844, -0.00017958879470825195, -5.424022674560547e-05, 7.110834121704102e-05, 0.0001964569091796875, 0.000321805477142334, 0.00044715404510498047, 0.000572502613067627, 0.0006978511810302734, 0.0008231997489929199, 0.0009485483169555664, 0.0010738968849182129, 0.0011992454528808594, 0.0013245940208435059, 0.0014499425888061523, 0.0015752911567687988, 0.0017006397247314453, 0.0018259882926940918, 0.0019513368606567383, 0.0020766854286193848, 0.0022020339965820312, 0.0023273825645446777, 0.0024527311325073242, 0.0025780797004699707, 0.002703428268432617, 0.0028287768363952637, 0.00295412540435791, 0.0030794739723205566, 0.003204822540283203, 0.0033301711082458496, 0.003455519676208496, 0.0035808682441711426, 0.003706216812133789, 0.0038315653800964355, 0.003956913948059082, 0.0040822625160217285, 0.004207611083984375]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 19.0, 592.0, 376.0, 27.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009625245584174991, -0.0009280359954573214, -0.0008935473742894828, -0.0008590588113293052, -0.0008245701901614666, -0.0007900816272012889, -0.0007555930642411113, -0.0007211044430732727, -0.000686615880113095, -0.0006521273171529174, -0.0006176386959850788, -0.0005831501330249012, -0.0005486615700647235, -0.0005141729488968849, -0.00047968438593670726, -0.00044519579387269914, -0.000410707201808691, -0.0003762186097446829, -0.0003417300176806748, -0.00030724145472049713, -0.000272752862656489, -0.0002382642705924809, -0.000203775693080388, -0.00016928711556829512, -0.000134798523504287, -0.0001003099387162365, -6.5821353928186e-05, -3.13327691401355e-05, 3.1558156479150057e-06, 3.764440771192312e-05, 7.213298522401601e-05, 0.0001066215627361089, 0.0001411100383847952, 0.0001755986304488033, 0.0002100872079608962, 0.0002445757854729891, 0.0002790643775369972, 0.0003135529696010053, 0.000348041532561183, 0.0003825301246251911, 0.0004170187166891992, 0.0004515073087532073, 0.00048599590081721544, 0.0005204844637773931, 0.0005549730267375708, 0.0005894616479054093, 0.000623950210865587, 0.0006584387738257647, 0.0006929273949936032, 0.0007274159579537809, 0.0007619045791216195, 0.0007963931420817971, 0.0008308817632496357, 0.0008653703262098134, 0.000899858889169991, 0.0009343475103378296, 0.0009688360732980072, 0.001003324636258185, 0.0010378132574260235, 0.001072301878593862, 0.0011067903833463788, 0.0011412790045142174, 0.001175767625682056, 0.0012102561304345727, 0.0012447447516024113]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 9.0, 6.0, 2.0, 12.0, 11.0, 15.0, 15.0, 18.0, 19.0, 25.0, 25.0, 25.0, 25.0, 29.0, 27.0, 49.0, 38.0, 32.0, 29.0, 32.0, 49.0, 33.0, 44.0, 29.0, 36.0, 32.0, 36.0, 25.0, 36.0, 30.0, 31.0, 20.0, 25.0, 21.0, 17.0, 21.0, 10.0, 14.0, 7.0, 5.0, 6.0, 6.0, 4.0, 5.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.0001232624053955078, -0.00011950545012950897, -0.00011574849486351013, -0.00011199153959751129, -0.00010823458433151245, -0.00010447762906551361, -0.00010072067379951477, -9.696371853351593e-05, -9.320676326751709e-05, -8.944980800151825e-05, -8.569285273551941e-05, -8.193589746952057e-05, -7.817894220352173e-05, -7.442198693752289e-05, -7.066503167152405e-05, -6.690807640552521e-05, -6.315112113952637e-05, -5.939416587352753e-05, -5.5637210607528687e-05, -5.1880255341529846e-05, -4.8123300075531006e-05, -4.4366344809532166e-05, -4.0609389543533325e-05, -3.6852434277534485e-05, -3.3095479011535645e-05, -2.9338523745536804e-05, -2.5581568479537964e-05, -2.1824613213539124e-05, -1.8067657947540283e-05, -1.4310702681541443e-05, -1.0553747415542603e-05, -6.796792149543762e-06, -3.039836883544922e-06, 7.171183824539185e-07, 4.474073648452759e-06, 8.231028914451599e-06, 1.198798418045044e-05, 1.574493944644928e-05, 1.950189471244812e-05, 2.325884997844696e-05, 2.70158052444458e-05, 3.077276051044464e-05, 3.452971577644348e-05, 3.828667104244232e-05, 4.204362630844116e-05, 4.580058157444e-05, 4.955753684043884e-05, 5.331449210643768e-05, 5.7071447372436523e-05, 6.0828402638435364e-05, 6.45853579044342e-05, 6.834231317043304e-05, 7.209926843643188e-05, 7.585622370243073e-05, 7.961317896842957e-05, 8.33701342344284e-05, 8.712708950042725e-05, 9.088404476642609e-05, 9.464100003242493e-05, 9.839795529842377e-05, 0.00010215491056442261, 0.00010591186583042145, 0.00010966882109642029, 0.00011342577636241913, 0.00011718273162841797]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 3.0, 2.0, 4.0, 6.0, 10.0, 11.0, 6.0, 14.0, 14.0, 12.0, 16.0, 26.0, 34.0, 21.0, 30.0, 45.0, 49.0, 44.0, 65.0, 53.0, 69.0, 48.0, 54.0, 55.0, 35.0, 41.0, 33.0, 39.0, 25.0, 18.0, 15.0, 18.0, 18.0, 9.0, 14.0, 10.0, 8.0, 4.0, 4.0, 2.0, 7.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.0859375, -8.8060302734375, -8.526123046875, -8.2462158203125, -7.96630859375, -7.6864013671875, -7.406494140625, -7.1265869140625, -6.8466796875, -6.5667724609375, -6.286865234375, -6.0069580078125, -5.72705078125, -5.4471435546875, -5.167236328125, -4.8873291015625, -4.607421875, -4.3275146484375, -4.047607421875, -3.7677001953125, -3.48779296875, -3.2078857421875, -2.927978515625, -2.6480712890625, -2.3681640625, -2.0882568359375, -1.808349609375, -1.5284423828125, -1.24853515625, -0.9686279296875, -0.688720703125, -0.4088134765625, -0.12890625, 0.1510009765625, 0.430908203125, 0.7108154296875, 0.99072265625, 1.2706298828125, 1.550537109375, 1.8304443359375, 2.1103515625, 2.3902587890625, 2.670166015625, 2.9500732421875, 3.22998046875, 3.5098876953125, 3.789794921875, 4.0697021484375, 4.349609375, 4.6295166015625, 4.909423828125, 5.1893310546875, 5.46923828125, 5.7491455078125, 6.029052734375, 6.3089599609375, 6.5888671875, 6.8687744140625, 7.148681640625, 7.4285888671875, 7.70849609375, 7.9884033203125, 8.268310546875, 8.5482177734375, 8.828125]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 4.0, 3.0, 6.0, 10.0, 18.0, 20.0, 25.0, 26.0, 45.0, 52.0, 88.0, 93.0, 125.0, 162.0, 255.0, 360.0, 546.0, 820.0, 1244.0, 2252.0, 4049.0, 7867.0, 20317.0, 133324.0, 795785.0, 52976.0, 13671.0, 6022.0, 3120.0, 1843.0, 1136.0, 685.0, 457.0, 285.0, 215.0, 150.0, 125.0, 89.0, 75.0, 53.0, 43.0, 25.0, 21.0, 14.0, 13.0, 16.0, 11.0, 8.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.0625, -14.6103515625, -14.158203125, -13.7060546875, -13.25390625, -12.8017578125, -12.349609375, -11.8974609375, -11.4453125, -10.9931640625, -10.541015625, -10.0888671875, -9.63671875, -9.1845703125, -8.732421875, -8.2802734375, -7.828125, -7.3759765625, -6.923828125, -6.4716796875, -6.01953125, -5.5673828125, -5.115234375, -4.6630859375, -4.2109375, -3.7587890625, -3.306640625, -2.8544921875, -2.40234375, -1.9501953125, -1.498046875, -1.0458984375, -0.59375, -0.1416015625, 0.310546875, 0.7626953125, 1.21484375, 1.6669921875, 2.119140625, 2.5712890625, 3.0234375, 3.4755859375, 3.927734375, 4.3798828125, 4.83203125, 5.2841796875, 5.736328125, 6.1884765625, 6.640625, 7.0927734375, 7.544921875, 7.9970703125, 8.44921875, 8.9013671875, 9.353515625, 9.8056640625, 10.2578125, 10.7099609375, 11.162109375, 11.6142578125, 12.06640625, 12.5185546875, 12.970703125, 13.4228515625, 13.875]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 5.0, 6.0, 5.0, 5.0, 5.0, 8.0, 10.0, 18.0, 17.0, 19.0, 25.0, 20.0, 26.0, 44.0, 41.0, 44.0, 49.0, 56.0, 57.0, 109.0, 1715.0, 260.0, 87.0, 60.0, 43.0, 49.0, 40.0, 31.0, 24.0, 32.0, 28.0, 24.0, 17.0, 12.0, 14.0, 4.0, 8.0, 9.0, 6.0, 4.0, 5.0, 3.0, 4.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-33.1875, -32.234375, -31.28125, -30.328125, -29.375, -28.421875, -27.46875, -26.515625, -25.5625, -24.609375, -23.65625, -22.703125, -21.75, -20.796875, -19.84375, -18.890625, -17.9375, -16.984375, -16.03125, -15.078125, -14.125, -13.171875, -12.21875, -11.265625, -10.3125, -9.359375, -8.40625, -7.453125, -6.5, -5.546875, -4.59375, -3.640625, -2.6875, -1.734375, -0.78125, 0.171875, 1.125, 2.078125, 3.03125, 3.984375, 4.9375, 5.890625, 6.84375, 7.796875, 8.75, 9.703125, 10.65625, 11.609375, 12.5625, 13.515625, 14.46875, 15.421875, 16.375, 17.328125, 18.28125, 19.234375, 20.1875, 21.140625, 22.09375, 23.046875, 24.0, 24.953125, 25.90625, 26.859375, 27.8125]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 1.0, 6.0, 5.0, 9.0, 7.0, 4.0, 13.0, 15.0, 21.0, 27.0, 37.0, 47.0, 65.0, 80.0, 126.0, 286.0, 601.0, 1521.0, 6901.0, 88240.0, 3002830.0, 38095.0, 4433.0, 1152.0, 473.0, 257.0, 134.0, 82.0, 52.0, 41.0, 31.0, 24.0, 23.0, 13.0, 14.0, 12.0, 5.0, 3.0, 6.0, 5.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-40.78125, -39.39306640625, -38.0048828125, -36.61669921875, -35.228515625, -33.84033203125, -32.4521484375, -31.06396484375, -29.67578125, -28.28759765625, -26.8994140625, -25.51123046875, -24.123046875, -22.73486328125, -21.3466796875, -19.95849609375, -18.5703125, -17.18212890625, -15.7939453125, -14.40576171875, -13.017578125, -11.62939453125, -10.2412109375, -8.85302734375, -7.46484375, -6.07666015625, -4.6884765625, -3.30029296875, -1.912109375, -0.52392578125, 0.8642578125, 2.25244140625, 3.640625, 5.02880859375, 6.4169921875, 7.80517578125, 9.193359375, 10.58154296875, 11.9697265625, 13.35791015625, 14.74609375, 16.13427734375, 17.5224609375, 18.91064453125, 20.298828125, 21.68701171875, 23.0751953125, 24.46337890625, 25.8515625, 27.23974609375, 28.6279296875, 30.01611328125, 31.404296875, 32.79248046875, 34.1806640625, 35.56884765625, 36.95703125, 38.34521484375, 39.7333984375, 41.12158203125, 42.509765625, 43.89794921875, 45.2861328125, 46.67431640625, 48.0625]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [8.0, 784.0, 221.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.034774780273438, -11.262662887573242, 2.509449005126953, 16.28156280517578, 30.053672790527344, 43.825782775878906, 57.597900390625, 71.37001037597656, 85.14212036132812, 98.91423034667969, 112.68634033203125, 126.45845794677734, 140.23056030273438, 154.002685546875, 167.77479553222656, 181.54690551757812, 195.3190155029297, 209.09112548828125, 222.8632354736328, 236.63534545898438, 250.407470703125, 264.1795654296875, 277.9516906738281, 291.72381591796875, 305.49591064453125, 319.2680358886719, 333.0401306152344, 346.812255859375, 360.5843505859375, 374.3564758300781, 388.12860107421875, 401.90069580078125, 415.67279052734375, 429.4449157714844, 443.2170104980469, 456.9891357421875, 470.76123046875, 484.5333557128906, 498.30548095703125, 512.0775756835938, 525.8496704101562, 539.6217651367188, 553.3939208984375, 567.166015625, 580.9381103515625, 594.710205078125, 608.4823608398438, 622.2544555664062, 636.026611328125, 649.7987060546875, 663.5708618164062, 677.3429565429688, 691.1150512695312, 704.8871459960938, 718.6593017578125, 732.431396484375, 746.2034912109375, 759.9755859375, 773.7477416992188, 787.5198364257812, 801.2919311523438, 815.0640258789062, 828.836181640625, 842.6082763671875, 856.38037109375]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 2.0, 6.0, 4.0, 4.0, 5.0, 6.0, 9.0, 9.0, 15.0, 12.0, 12.0, 24.0, 22.0, 30.0, 33.0, 32.0, 26.0, 34.0, 32.0, 40.0, 35.0, 44.0, 59.0, 43.0, 38.0, 39.0, 48.0, 44.0, 36.0, 35.0, 28.0, 34.0, 27.0, 20.0, 24.0, 15.0, 11.0, 12.0, 18.0, 8.0, 7.0, 3.0, 5.0, 7.0, 0.0, 6.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0], "bins": [-100.16007232666016, -97.13978576660156, -94.11949920654297, -91.0992202758789, -88.07893371582031, -85.05864715576172, -82.03836059570312, -79.01808166503906, -75.99779510498047, -72.97750854492188, -69.95722198486328, -66.93694305419922, -63.916656494140625, -60.89636993408203, -57.87608337402344, -54.85580062866211, -51.835514068603516, -48.81522750854492, -45.794944763183594, -42.774658203125, -39.75437545776367, -36.73408889770508, -33.71380615234375, -30.693519592285156, -27.673234939575195, -24.652950286865234, -21.632665634155273, -18.612380981445312, -15.592095375061035, -12.571810722351074, -9.551525115966797, -6.531240463256836, -3.510955810546875, -0.49067091941833496, 2.529613971710205, 5.549899101257324, 8.570183753967285, 11.590468406677246, 14.610754013061523, 17.631038665771484, 20.651323318481445, 23.671607971191406, 26.691892623901367, 29.712177276611328, 32.73246383666992, 35.75274658203125, 38.773033142089844, 41.79331970214844, 44.813602447509766, 47.83388900756836, 50.85417175292969, 53.87445831298828, 56.89474105834961, 59.9150276184082, 62.93531036376953, 65.95559692382812, 68.97588348388672, 71.99617004394531, 75.0164566040039, 78.03673553466797, 81.05702209472656, 84.07730865478516, 87.09759521484375, 90.11787414550781, 93.1381607055664]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 5.0, 2.0, 3.0, 10.0, 9.0, 12.0, 13.0, 7.0, 15.0, 17.0, 27.0, 24.0, 31.0, 33.0, 44.0, 39.0, 53.0, 52.0, 51.0, 69.0, 60.0, 53.0, 50.0, 46.0, 39.0, 36.0, 28.0, 31.0, 17.0, 21.0, 14.0, 15.0, 14.0, 18.0, 10.0, 9.0, 1.0, 5.0, 3.0, 5.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.2734375, -8.989501953125, -8.70556640625, -8.421630859375, -8.1376953125, -7.853759765625, -7.56982421875, -7.285888671875, -7.001953125, -6.718017578125, -6.43408203125, -6.150146484375, -5.8662109375, -5.582275390625, -5.29833984375, -5.014404296875, -4.73046875, -4.446533203125, -4.16259765625, -3.878662109375, -3.5947265625, -3.310791015625, -3.02685546875, -2.742919921875, -2.458984375, -2.175048828125, -1.89111328125, -1.607177734375, -1.3232421875, -1.039306640625, -0.75537109375, -0.471435546875, -0.1875, 0.096435546875, 0.38037109375, 0.664306640625, 0.9482421875, 1.232177734375, 1.51611328125, 1.800048828125, 2.083984375, 2.367919921875, 2.65185546875, 2.935791015625, 3.2197265625, 3.503662109375, 3.78759765625, 4.071533203125, 4.35546875, 4.639404296875, 4.92333984375, 5.207275390625, 5.4912109375, 5.775146484375, 6.05908203125, 6.343017578125, 6.626953125, 6.910888671875, 7.19482421875, 7.478759765625, 7.7626953125, 8.046630859375, 8.33056640625, 8.614501953125, 8.8984375]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 7.0, 7.0, 8.0, 14.0, 19.0, 21.0, 36.0, 49.0, 52.0, 123.0, 181.0, 282.0, 443.0, 717.0, 1189.0, 2148.0, 3988.0, 8250.0, 21876.0, 359691.0, 3592159.0, 170352.0, 17483.0, 7069.0, 3536.0, 1893.0, 1037.0, 646.0, 406.0, 192.0, 139.0, 80.0, 72.0, 30.0, 32.0, 21.0, 12.0, 5.0, 5.0, 2.0, 1.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.71875, -33.67919921875, -32.6396484375, -31.60009765625, -30.560546875, -29.52099609375, -28.4814453125, -27.44189453125, -26.40234375, -25.36279296875, -24.3232421875, -23.28369140625, -22.244140625, -21.20458984375, -20.1650390625, -19.12548828125, -18.0859375, -17.04638671875, -16.0068359375, -14.96728515625, -13.927734375, -12.88818359375, -11.8486328125, -10.80908203125, -9.76953125, -8.72998046875, -7.6904296875, -6.65087890625, -5.611328125, -4.57177734375, -3.5322265625, -2.49267578125, -1.453125, -0.41357421875, 0.6259765625, 1.66552734375, 2.705078125, 3.74462890625, 4.7841796875, 5.82373046875, 6.86328125, 7.90283203125, 8.9423828125, 9.98193359375, 11.021484375, 12.06103515625, 13.1005859375, 14.14013671875, 15.1796875, 16.21923828125, 17.2587890625, 18.29833984375, 19.337890625, 20.37744140625, 21.4169921875, 22.45654296875, 23.49609375, 24.53564453125, 25.5751953125, 26.61474609375, 27.654296875, 28.69384765625, 29.7333984375, 30.77294921875, 31.8125]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 5.0, 7.0, 8.0, 8.0, 5.0, 4.0, 10.0, 18.0, 13.0, 20.0, 25.0, 41.0, 39.0, 50.0, 99.0, 193.0, 373.0, 714.0, 961.0, 674.0, 317.0, 164.0, 71.0, 58.0, 27.0, 40.0, 24.0, 15.0, 26.0, 7.0, 11.0, 10.0, 6.0, 4.0, 6.0, 4.0, 2.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-25.296875, -24.516357421875, -23.73583984375, -22.955322265625, -22.1748046875, -21.394287109375, -20.61376953125, -19.833251953125, -19.052734375, -18.272216796875, -17.49169921875, -16.711181640625, -15.9306640625, -15.150146484375, -14.36962890625, -13.589111328125, -12.80859375, -12.028076171875, -11.24755859375, -10.467041015625, -9.6865234375, -8.906005859375, -8.12548828125, -7.344970703125, -6.564453125, -5.783935546875, -5.00341796875, -4.222900390625, -3.4423828125, -2.661865234375, -1.88134765625, -1.100830078125, -0.3203125, 0.460205078125, 1.24072265625, 2.021240234375, 2.8017578125, 3.582275390625, 4.36279296875, 5.143310546875, 5.923828125, 6.704345703125, 7.48486328125, 8.265380859375, 9.0458984375, 9.826416015625, 10.60693359375, 11.387451171875, 12.16796875, 12.948486328125, 13.72900390625, 14.509521484375, 15.2900390625, 16.070556640625, 16.85107421875, 17.631591796875, 18.412109375, 19.192626953125, 19.97314453125, 20.753662109375, 21.5341796875, 22.314697265625, 23.09521484375, 23.875732421875, 24.65625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 6.0, 7.0, 6.0, 12.0, 15.0, 21.0, 24.0, 37.0, 55.0, 80.0, 112.0, 170.0, 239.0, 394.0, 579.0, 991.0, 1620.0, 2848.0, 5362.0, 10841.0, 24947.0, 76530.0, 751621.0, 3064432.0, 179383.0, 40918.0, 16001.0, 7619.0, 3890.0, 2113.0, 1257.0, 781.0, 501.0, 303.0, 168.0, 99.0, 63.0, 62.0, 46.0, 36.0, 27.0, 21.0, 12.0, 9.0, 5.0, 6.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-30.6875, -29.73583984375, -28.7841796875, -27.83251953125, -26.880859375, -25.92919921875, -24.9775390625, -24.02587890625, -23.07421875, -22.12255859375, -21.1708984375, -20.21923828125, -19.267578125, -18.31591796875, -17.3642578125, -16.41259765625, -15.4609375, -14.50927734375, -13.5576171875, -12.60595703125, -11.654296875, -10.70263671875, -9.7509765625, -8.79931640625, -7.84765625, -6.89599609375, -5.9443359375, -4.99267578125, -4.041015625, -3.08935546875, -2.1376953125, -1.18603515625, -0.234375, 0.71728515625, 1.6689453125, 2.62060546875, 3.572265625, 4.52392578125, 5.4755859375, 6.42724609375, 7.37890625, 8.33056640625, 9.2822265625, 10.23388671875, 11.185546875, 12.13720703125, 13.0888671875, 14.04052734375, 14.9921875, 15.94384765625, 16.8955078125, 17.84716796875, 18.798828125, 19.75048828125, 20.7021484375, 21.65380859375, 22.60546875, 23.55712890625, 24.5087890625, 25.46044921875, 26.412109375, 27.36376953125, 28.3154296875, 29.26708984375, 30.21875]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 5.0, 4.0, 10.0, 12.0, 26.0, 34.0, 68.0, 128.0, 190.0, 204.0, 133.0, 68.0, 56.0, 25.0, 17.0, 15.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.36418151855469, -74.26775360107422, -70.17131805419922, -66.07489013671875, -61.978458404541016, -57.88202667236328, -53.78559875488281, -49.68916702270508, -45.592735290527344, -41.49630355834961, -37.399871826171875, -33.303443908691406, -29.207012176513672, -25.110580444335938, -21.014150619506836, -16.917720794677734, -12.8212890625, -8.724858283996582, -4.628427505493164, -0.5319967269897461, 3.564434051513672, 7.660865783691406, 11.757295608520508, 15.85372543334961, 19.950157165527344, 24.046588897705078, 28.14301872253418, 32.23944854736328, 36.335880279541016, 40.43231201171875, 44.52873992919922, 48.62517166137695, 52.72160339355469, 56.81803512573242, 60.914466857910156, 65.01089477539062, 69.10733032226562, 73.2037582397461, 77.30018615722656, 81.39662170410156, 85.49304962158203, 89.5894775390625, 93.6859130859375, 97.78234100341797, 101.87876892089844, 105.97520446777344, 110.0716323852539, 114.16806030273438, 118.26449584960938, 122.36092376708984, 126.45735931396484, 130.5537872314453, 134.6502227783203, 138.74664306640625, 142.84307861328125, 146.93951416015625, 151.03594970703125, 155.13238525390625, 159.2288055419922, 163.3252410888672, 167.4216766357422, 171.51809692382812, 175.61453247070312, 179.71096801757812, 183.80738830566406]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 0.0, 2.0, 3.0, 6.0, 1.0, 9.0, 5.0, 8.0, 13.0, 10.0, 15.0, 13.0, 19.0, 22.0, 21.0, 24.0, 28.0, 51.0, 38.0, 32.0, 39.0, 43.0, 54.0, 48.0, 43.0, 44.0, 51.0, 49.0, 33.0, 28.0, 35.0, 32.0, 24.0, 23.0, 20.0, 17.0, 25.0, 20.0, 17.0, 9.0, 8.0, 8.0, 7.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.7494125366211, -75.25308990478516, -72.75676727294922, -70.26044464111328, -67.76412200927734, -65.2677993774414, -62.771480560302734, -60.2751579284668, -57.77883529663086, -55.28251266479492, -52.786190032958984, -50.28986740112305, -47.793548583984375, -45.29722595214844, -42.8009033203125, -40.30458068847656, -37.808258056640625, -35.31193542480469, -32.81561279296875, -30.319292068481445, -27.822969436645508, -25.32664680480957, -22.830326080322266, -20.334003448486328, -17.83768081665039, -15.341358184814453, -12.845036506652832, -10.348714828491211, -7.852392196655273, -5.356069564819336, -2.859747886657715, -0.36342620849609375, 2.132904052734375, 4.629226207733154, 7.125548362731934, 9.621870040893555, 12.118192672729492, 14.61451530456543, 17.110836029052734, 19.607158660888672, 22.10348129272461, 24.599803924560547, 27.096126556396484, 29.59244728088379, 32.088768005371094, 34.58509063720703, 37.08141326904297, 39.577735900878906, 42.074058532714844, 44.57038116455078, 47.06670379638672, 49.563026428222656, 52.059349060058594, 54.55567169189453, 57.0519905090332, 59.54831314086914, 62.04463577270508, 64.54095458984375, 67.03727722167969, 69.53359985351562, 72.02992248535156, 74.5262451171875, 77.02256774902344, 79.51889038085938, 82.01521301269531]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 3.0, 5.0, 3.0, 9.0, 15.0, 6.0, 14.0, 16.0, 18.0, 25.0, 24.0, 33.0, 39.0, 29.0, 44.0, 60.0, 36.0, 54.0, 54.0, 59.0, 49.0, 46.0, 44.0, 56.0, 33.0, 32.0, 29.0, 24.0, 29.0, 12.0, 19.0, 11.0, 15.0, 9.0, 13.0, 5.0, 4.0, 5.0, 7.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.09375, -8.8184814453125, -8.543212890625, -8.2679443359375, -7.99267578125, -7.7174072265625, -7.442138671875, -7.1668701171875, -6.8916015625, -6.6163330078125, -6.341064453125, -6.0657958984375, -5.79052734375, -5.5152587890625, -5.239990234375, -4.9647216796875, -4.689453125, -4.4141845703125, -4.138916015625, -3.8636474609375, -3.58837890625, -3.3131103515625, -3.037841796875, -2.7625732421875, -2.4873046875, -2.2120361328125, -1.936767578125, -1.6614990234375, -1.38623046875, -1.1109619140625, -0.835693359375, -0.5604248046875, -0.28515625, -0.0098876953125, 0.265380859375, 0.5406494140625, 0.81591796875, 1.0911865234375, 1.366455078125, 1.6417236328125, 1.9169921875, 2.1922607421875, 2.467529296875, 2.7427978515625, 3.01806640625, 3.2933349609375, 3.568603515625, 3.8438720703125, 4.119140625, 4.3944091796875, 4.669677734375, 4.9449462890625, 5.22021484375, 5.4954833984375, 5.770751953125, 6.0460205078125, 6.3212890625, 6.5965576171875, 6.871826171875, 7.1470947265625, 7.42236328125, 7.6976318359375, 7.972900390625, 8.2481689453125, 8.5234375]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 8.0, 6.0, 12.0, 22.0, 20.0, 42.0, 56.0, 89.0, 119.0, 148.0, 227.0, 332.0, 483.0, 707.0, 1091.0, 1575.0, 2533.0, 3892.0, 6016.0, 9637.0, 15729.0, 25848.0, 43997.0, 76285.0, 139091.0, 253598.0, 204781.0, 108949.0, 60888.0, 35645.0, 21217.0, 12990.0, 7984.0, 4994.0, 3230.0, 2090.0, 1364.0, 880.0, 654.0, 417.0, 278.0, 171.0, 150.0, 94.0, 78.0, 54.0, 25.0, 16.0, 15.0, 9.0, 9.0, 7.0, 3.0, 3.0, 4.0, 3.0, 2.0, 2.0], "bins": [-0.1756591796875, -0.170135498046875, -0.16461181640625, -0.159088134765625, -0.153564453125, -0.148040771484375, -0.14251708984375, -0.136993408203125, -0.1314697265625, -0.125946044921875, -0.12042236328125, -0.114898681640625, -0.109375, -0.103851318359375, -0.09832763671875, -0.092803955078125, -0.0872802734375, -0.081756591796875, -0.07623291015625, -0.070709228515625, -0.065185546875, -0.059661865234375, -0.05413818359375, -0.048614501953125, -0.0430908203125, -0.037567138671875, -0.03204345703125, -0.026519775390625, -0.02099609375, -0.015472412109375, -0.00994873046875, -0.004425048828125, 0.0010986328125, 0.006622314453125, 0.01214599609375, 0.017669677734375, 0.023193359375, 0.028717041015625, 0.03424072265625, 0.039764404296875, 0.0452880859375, 0.050811767578125, 0.05633544921875, 0.061859130859375, 0.0673828125, 0.072906494140625, 0.07843017578125, 0.083953857421875, 0.0894775390625, 0.095001220703125, 0.10052490234375, 0.106048583984375, 0.111572265625, 0.117095947265625, 0.12261962890625, 0.128143310546875, 0.1336669921875, 0.139190673828125, 0.14471435546875, 0.150238037109375, 0.15576171875, 0.161285400390625, 0.16680908203125, 0.172332763671875, 0.1778564453125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 7.0, 4.0, 7.0, 9.0, 12.0, 8.0, 9.0, 10.0, 20.0, 25.0, 23.0, 17.0, 20.0, 21.0, 42.0, 33.0, 36.0, 28.0, 23.0, 36.0, 44.0, 45.0, 1068.0, 40.0, 38.0, 45.0, 36.0, 34.0, 37.0, 30.0, 26.0, 25.0, 22.0, 20.0, 15.0, 17.0, 14.0, 15.0, 9.0, 10.0, 10.0, 12.0, 7.0, 3.0, 5.0, 4.0, 2.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-3.966796875, -3.832489013671875, -3.69818115234375, -3.563873291015625, -3.4295654296875, -3.295257568359375, -3.16094970703125, -3.026641845703125, -2.892333984375, -2.758026123046875, -2.62371826171875, -2.489410400390625, -2.3551025390625, -2.220794677734375, -2.08648681640625, -1.952178955078125, -1.81787109375, -1.683563232421875, -1.54925537109375, -1.414947509765625, -1.2806396484375, -1.146331787109375, -1.01202392578125, -0.877716064453125, -0.743408203125, -0.609100341796875, -0.47479248046875, -0.340484619140625, -0.2061767578125, -0.071868896484375, 0.06243896484375, 0.196746826171875, 0.3310546875, 0.465362548828125, 0.59967041015625, 0.733978271484375, 0.8682861328125, 1.002593994140625, 1.13690185546875, 1.271209716796875, 1.405517578125, 1.539825439453125, 1.67413330078125, 1.808441162109375, 1.9427490234375, 2.077056884765625, 2.21136474609375, 2.345672607421875, 2.47998046875, 2.614288330078125, 2.74859619140625, 2.882904052734375, 3.0172119140625, 3.151519775390625, 3.28582763671875, 3.420135498046875, 3.554443359375, 3.688751220703125, 3.82305908203125, 3.957366943359375, 4.0916748046875, 4.225982666015625, 4.36029052734375, 4.494598388671875, 4.62890625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 7.0, 11.0, 21.0, 23.0, 41.0, 50.0, 96.0, 111.0, 176.0, 277.0, 358.0, 588.0, 831.0, 1226.0, 1828.0, 2790.0, 4219.0, 6322.0, 9228.0, 14474.0, 21146.0, 32230.0, 48487.0, 74877.0, 118717.0, 812722.0, 608040.0, 118561.0, 75053.0, 49034.0, 31870.0, 21376.0, 14130.0, 9433.0, 6196.0, 4052.0, 2791.0, 1875.0, 1230.0, 857.0, 595.0, 389.0, 265.0, 173.0, 117.0, 85.0, 53.0, 37.0, 27.0, 14.0, 12.0, 3.0, 7.0, 9.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.06988525390625, -0.06763076782226562, -0.06537628173828125, -0.06312179565429688, -0.0608673095703125, -0.058612823486328125, -0.05635833740234375, -0.054103851318359375, -0.051849365234375, -0.049594879150390625, -0.04734039306640625, -0.045085906982421875, -0.0428314208984375, -0.040576934814453125, -0.03832244873046875, -0.036067962646484375, -0.0338134765625, -0.031558990478515625, -0.02930450439453125, -0.027050018310546875, -0.0247955322265625, -0.022541046142578125, -0.02028656005859375, -0.018032073974609375, -0.015777587890625, -0.013523101806640625, -0.01126861572265625, -0.009014129638671875, -0.0067596435546875, -0.004505157470703125, -0.00225067138671875, 3.814697265625e-06, 0.00225830078125, 0.004512786865234375, 0.00676727294921875, 0.009021759033203125, 0.0112762451171875, 0.013530731201171875, 0.01578521728515625, 0.018039703369140625, 0.020294189453125, 0.022548675537109375, 0.02480316162109375, 0.027057647705078125, 0.0293121337890625, 0.031566619873046875, 0.03382110595703125, 0.036075592041015625, 0.038330078125, 0.040584564208984375, 0.04283905029296875, 0.045093536376953125, 0.0473480224609375, 0.049602508544921875, 0.05185699462890625, 0.054111480712890625, 0.056365966796875, 0.058620452880859375, 0.06087493896484375, 0.06312942504882812, 0.0653839111328125, 0.06763839721679688, 0.06989288330078125, 0.07214736938476562, 0.07440185546875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 3.0, 7.0, 19.0, 17.0, 26.0, 30.0, 39.0, 52.0, 54.0, 88.0, 81.0, 71.0, 65.0, 76.0, 77.0, 77.0, 60.0, 43.0, 26.0, 25.0, 17.0, 17.0, 11.0, 10.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003476142883300781, -0.0003368891775608063, -0.0003261640667915344, -0.0003154389560222626, -0.0003047138452529907, -0.00029398873448371887, -0.000283263623714447, -0.00027253851294517517, -0.0002618134021759033, -0.00025108829140663147, -0.00024036318063735962, -0.00022963806986808777, -0.00021891295909881592, -0.00020818784832954407, -0.00019746273756027222, -0.00018673762679100037, -0.00017601251602172852, -0.00016528740525245667, -0.00015456229448318481, -0.00014383718371391296, -0.0001331120729446411, -0.00012238696217536926, -0.00011166185140609741, -0.00010093674063682556, -9.021162986755371e-05, -7.948651909828186e-05, -6.876140832901001e-05, -5.803629755973816e-05, -4.731118679046631e-05, -3.658607602119446e-05, -2.5860965251922607e-05, -1.5135854482650757e-05, -4.410743713378906e-06, 6.314367055892944e-06, 1.7039477825164795e-05, 2.7764588594436646e-05, 3.8489699363708496e-05, 4.921481013298035e-05, 5.99399209022522e-05, 7.066503167152405e-05, 8.13901424407959e-05, 9.211525321006775e-05, 0.0001028403639793396, 0.00011356547474861145, 0.0001242905855178833, 0.00013501569628715515, 0.000145740807056427, 0.00015646591782569885, 0.0001671910285949707, 0.00017791613936424255, 0.0001886412501335144, 0.00019936636090278625, 0.0002100914716720581, 0.00022081658244132996, 0.0002315416932106018, 0.00024226680397987366, 0.0002529919147491455, 0.00026371702551841736, 0.0002744421362876892, 0.00028516724705696106, 0.0002958923578262329, 0.00030661746859550476, 0.0003173425793647766, 0.00032806769013404846, 0.0003387928009033203]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 9.0, 13.0, 16.0, 19.0, 39.0, 70.0, 80.0, 125.0, 167.0, 250.0, 350.0, 727.0, 9486.0, 1025911.0, 9432.0, 773.0, 338.0, 215.0, 144.0, 126.0, 76.0, 61.0, 39.0, 35.0, 19.0, 7.0, 5.0, 3.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0052642822265625, -0.005097150802612305, -0.004930019378662109, -0.004762887954711914, -0.004595756530761719, -0.0044286251068115234, -0.004261493682861328, -0.004094362258911133, -0.0039272308349609375, -0.003760099411010742, -0.003592967987060547, -0.0034258365631103516, -0.0032587051391601562, -0.003091573715209961, -0.0029244422912597656, -0.0027573108673095703, -0.002590179443359375, -0.0024230480194091797, -0.0022559165954589844, -0.002088785171508789, -0.0019216537475585938, -0.0017545223236083984, -0.0015873908996582031, -0.0014202594757080078, -0.0012531280517578125, -0.0010859966278076172, -0.0009188652038574219, -0.0007517337799072266, -0.0005846023559570312, -0.00041747093200683594, -0.0002503395080566406, -8.320808410644531e-05, 8.392333984375e-05, 0.0002510547637939453, 0.0004181861877441406, 0.0005853176116943359, 0.0007524490356445312, 0.0009195804595947266, 0.0010867118835449219, 0.0012538433074951172, 0.0014209747314453125, 0.0015881061553955078, 0.0017552375793457031, 0.0019223690032958984, 0.0020895004272460938, 0.002256631851196289, 0.0024237632751464844, 0.0025908946990966797, 0.002758026123046875, 0.0029251575469970703, 0.0030922889709472656, 0.003259420394897461, 0.0034265518188476562, 0.0035936832427978516, 0.003760814666748047, 0.003927946090698242, 0.0040950775146484375, 0.004262208938598633, 0.004429340362548828, 0.0045964717864990234, 0.004763603210449219, 0.004930734634399414, 0.005097866058349609, 0.005264997482299805, 0.00543212890625]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 60.0, 900.0, 51.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.003988742362707853, -0.003920490853488445, -0.0038522391114383936, -0.003783987369388342, -0.003715735860168934, -0.003647484118118882, -0.003579232608899474, -0.0035109808668494225, -0.0034427293576300144, -0.0033744776155799627, -0.0033062261063605547, -0.003237974364310503, -0.003169722855091095, -0.0031014711130410433, -0.0030332196038216352, -0.0029649678617715836, -0.0028967163525521755, -0.002828464610502124, -0.002760213101282716, -0.002691961359232664, -0.002623709850013256, -0.0025554581079632044, -0.0024872065987437963, -0.0024189548566937447, -0.002350703114643693, -0.0022824513725936413, -0.0022141998633742332, -0.0021459481213241816, -0.0020776966121047735, -0.002009444870054722, -0.0019411933608353138, -0.001872941618785262, -0.0018046898767352104, -0.0017364382511004806, -0.0016681866254657507, -0.0015999349998310208, -0.001531683374196291, -0.001463431748561561, -0.0013951801229268312, -0.0013269283808767796, -0.0012586768716573715, -0.0011904252460226417, -0.0011221736203879118, -0.001053921994753182, -0.000985670369118452, -0.0009174187434837222, -0.0008491670596413314, -0.0007809154340066016, -0.0007126637501642108, -0.0006444121245294809, -0.0005761604988947511, -0.0005079088732600212, -0.0004396572185214609, -0.00037140559288673103, -0.0003031539381481707, -0.00023490231251344085, -0.00016665071598254144, -9.839908307185397e-05, -3.014745016116649e-05, 3.81041900254786e-05, 0.00010635581566020846, 0.00017460744129493833, 0.00024285909603349864, 0.0003111107216682285, 0.00037936234730295837]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 4.0, 1.0, 6.0, 7.0, 5.0, 5.0, 14.0, 12.0, 18.0, 27.0, 23.0, 20.0, 23.0, 33.0, 45.0, 41.0, 47.0, 43.0, 47.0, 44.0, 50.0, 45.0, 58.0, 44.0, 43.0, 42.0, 38.0, 32.0, 32.0, 25.0, 18.0, 22.0, 21.0, 18.0, 12.0, 10.0, 14.0, 8.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001506805419921875, -0.0001443866640329361, -0.0001380927860736847, -0.0001317989081144333, -0.00012550503015518188, -0.00011921115219593048, -0.00011291727423667908, -0.00010662339627742767, -0.00010032951831817627, -9.403564035892487e-05, -8.774176239967346e-05, -8.144788444042206e-05, -7.515400648117065e-05, -6.886012852191925e-05, -6.256625056266785e-05, -5.627237260341644e-05, -4.997849464416504e-05, -4.3684616684913635e-05, -3.739073872566223e-05, -3.109686076641083e-05, -2.4802982807159424e-05, -1.850910484790802e-05, -1.2215226888656616e-05, -5.921348929405212e-06, 3.725290298461914e-07, 6.666406989097595e-06, 1.2960284948348999e-05, 1.9254162907600403e-05, 2.5548040866851807e-05, 3.184191882610321e-05, 3.8135796785354614e-05, 4.442967474460602e-05, 5.072355270385742e-05, 5.7017430663108826e-05, 6.331130862236023e-05, 6.960518658161163e-05, 7.589906454086304e-05, 8.219294250011444e-05, 8.848682045936584e-05, 9.478069841861725e-05, 0.00010107457637786865, 0.00010736845433712006, 0.00011366233229637146, 0.00011995621025562286, 0.00012625008821487427, 0.00013254396617412567, 0.00013883784413337708, 0.00014513172209262848, 0.00015142560005187988, 0.0001577194780111313, 0.0001640133559703827, 0.0001703072339296341, 0.0001766011118888855, 0.0001828949898481369, 0.0001891888678073883, 0.0001954827457666397, 0.0002017766237258911, 0.00020807050168514252, 0.00021436437964439392, 0.00022065825760364532, 0.00022695213556289673, 0.00023324601352214813, 0.00023953989148139954, 0.00024583376944065094, 0.00025212764739990234]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 3.0, 5.0, 3.0, 9.0, 15.0, 6.0, 14.0, 16.0, 18.0, 25.0, 24.0, 33.0, 39.0, 29.0, 44.0, 60.0, 36.0, 54.0, 54.0, 59.0, 49.0, 46.0, 44.0, 56.0, 33.0, 32.0, 29.0, 24.0, 29.0, 12.0, 19.0, 11.0, 15.0, 9.0, 13.0, 5.0, 4.0, 5.0, 7.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.09375, -8.8184814453125, -8.543212890625, -8.2679443359375, -7.99267578125, -7.7174072265625, -7.442138671875, -7.1668701171875, -6.8916015625, -6.6163330078125, -6.341064453125, -6.0657958984375, -5.79052734375, -5.5152587890625, -5.239990234375, -4.9647216796875, -4.689453125, -4.4141845703125, -4.138916015625, -3.8636474609375, -3.58837890625, -3.3131103515625, -3.037841796875, -2.7625732421875, -2.4873046875, -2.2120361328125, -1.936767578125, -1.6614990234375, -1.38623046875, -1.1109619140625, -0.835693359375, -0.5604248046875, -0.28515625, -0.0098876953125, 0.265380859375, 0.5406494140625, 0.81591796875, 1.0911865234375, 1.366455078125, 1.6417236328125, 1.9169921875, 2.1922607421875, 2.467529296875, 2.7427978515625, 3.01806640625, 3.2933349609375, 3.568603515625, 3.8438720703125, 4.119140625, 4.3944091796875, 4.669677734375, 4.9449462890625, 5.22021484375, 5.4954833984375, 5.770751953125, 6.0460205078125, 6.3212890625, 6.5965576171875, 6.871826171875, 7.1470947265625, 7.42236328125, 7.6976318359375, 7.972900390625, 8.2481689453125, 8.5234375]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 6.0, 5.0, 15.0, 11.0, 22.0, 29.0, 37.0, 62.0, 86.0, 113.0, 164.0, 235.0, 353.0, 473.0, 737.0, 1001.0, 1566.0, 2422.0, 3934.0, 6848.0, 14223.0, 38858.0, 296877.0, 592431.0, 51325.0, 16629.0, 7850.0, 4350.0, 2586.0, 1661.0, 1118.0, 775.0, 544.0, 379.0, 221.0, 199.0, 130.0, 95.0, 50.0, 40.0, 22.0, 21.0, 17.0, 18.0, 7.0, 7.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-17.765625, -17.1943359375, -16.623046875, -16.0517578125, -15.48046875, -14.9091796875, -14.337890625, -13.7666015625, -13.1953125, -12.6240234375, -12.052734375, -11.4814453125, -10.91015625, -10.3388671875, -9.767578125, -9.1962890625, -8.625, -8.0537109375, -7.482421875, -6.9111328125, -6.33984375, -5.7685546875, -5.197265625, -4.6259765625, -4.0546875, -3.4833984375, -2.912109375, -2.3408203125, -1.76953125, -1.1982421875, -0.626953125, -0.0556640625, 0.515625, 1.0869140625, 1.658203125, 2.2294921875, 2.80078125, 3.3720703125, 3.943359375, 4.5146484375, 5.0859375, 5.6572265625, 6.228515625, 6.7998046875, 7.37109375, 7.9423828125, 8.513671875, 9.0849609375, 9.65625, 10.2275390625, 10.798828125, 11.3701171875, 11.94140625, 12.5126953125, 13.083984375, 13.6552734375, 14.2265625, 14.7978515625, 15.369140625, 15.9404296875, 16.51171875, 17.0830078125, 17.654296875, 18.2255859375, 18.796875]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 5.0, 5.0, 7.0, 13.0, 17.0, 17.0, 25.0, 12.0, 19.0, 23.0, 26.0, 34.0, 51.0, 56.0, 60.0, 79.0, 154.0, 1537.0, 315.0, 132.0, 67.0, 57.0, 48.0, 30.0, 21.0, 35.0, 38.0, 16.0, 19.0, 12.0, 19.0, 23.0, 14.0, 16.0, 13.0, 6.0, 13.0, 5.0, 2.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-31.8125, -30.873046875, -29.93359375, -28.994140625, -28.0546875, -27.115234375, -26.17578125, -25.236328125, -24.296875, -23.357421875, -22.41796875, -21.478515625, -20.5390625, -19.599609375, -18.66015625, -17.720703125, -16.78125, -15.841796875, -14.90234375, -13.962890625, -13.0234375, -12.083984375, -11.14453125, -10.205078125, -9.265625, -8.326171875, -7.38671875, -6.447265625, -5.5078125, -4.568359375, -3.62890625, -2.689453125, -1.75, -0.810546875, 0.12890625, 1.068359375, 2.0078125, 2.947265625, 3.88671875, 4.826171875, 5.765625, 6.705078125, 7.64453125, 8.583984375, 9.5234375, 10.462890625, 11.40234375, 12.341796875, 13.28125, 14.220703125, 15.16015625, 16.099609375, 17.0390625, 17.978515625, 18.91796875, 19.857421875, 20.796875, 21.736328125, 22.67578125, 23.615234375, 24.5546875, 25.494140625, 26.43359375, 27.373046875, 28.3125]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 8.0, 6.0, 8.0, 13.0, 10.0, 20.0, 9.0, 26.0, 12.0, 22.0, 39.0, 61.0, 77.0, 106.0, 234.0, 533.0, 1433.0, 5015.0, 25698.0, 2263933.0, 821314.0, 20573.0, 4247.0, 1296.0, 489.0, 201.0, 110.0, 57.0, 32.0, 23.0, 17.0, 20.0, 19.0, 15.0, 6.0, 7.0, 4.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.84375, -40.4462890625, -39.048828125, -37.6513671875, -36.25390625, -34.8564453125, -33.458984375, -32.0615234375, -30.6640625, -29.2666015625, -27.869140625, -26.4716796875, -25.07421875, -23.6767578125, -22.279296875, -20.8818359375, -19.484375, -18.0869140625, -16.689453125, -15.2919921875, -13.89453125, -12.4970703125, -11.099609375, -9.7021484375, -8.3046875, -6.9072265625, -5.509765625, -4.1123046875, -2.71484375, -1.3173828125, 0.080078125, 1.4775390625, 2.875, 4.2724609375, 5.669921875, 7.0673828125, 8.46484375, 9.8623046875, 11.259765625, 12.6572265625, 14.0546875, 15.4521484375, 16.849609375, 18.2470703125, 19.64453125, 21.0419921875, 22.439453125, 23.8369140625, 25.234375, 26.6318359375, 28.029296875, 29.4267578125, 30.82421875, 32.2216796875, 33.619140625, 35.0166015625, 36.4140625, 37.8115234375, 39.208984375, 40.6064453125, 42.00390625, 43.4013671875, 44.798828125, 46.1962890625, 47.59375]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 15.0, 36.0, 52.0, 68.0, 150.0, 181.0, 196.0, 139.0, 68.0, 40.0, 25.0, 10.0, 7.0, 6.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-72.12922668457031, -69.99588012695312, -67.86253356933594, -65.72918701171875, -63.59584426879883, -61.46249771118164, -59.32915115356445, -57.195804595947266, -55.062461853027344, -52.929115295410156, -50.79576873779297, -48.66242218017578, -46.52907943725586, -44.39573287963867, -42.262386322021484, -40.1290397644043, -37.99569320678711, -35.86234664916992, -33.729000091552734, -31.59565544128418, -29.462310791015625, -27.328964233398438, -25.19561767578125, -23.062271118164062, -20.928926467895508, -18.79557991027832, -16.662235260009766, -14.528888702392578, -12.395543098449707, -10.262197494506836, -8.128850936889648, -5.995505332946777, -3.8621597290039062, -1.728813886642456, 0.40453195571899414, 2.5378780364990234, 4.6712236404418945, 6.804569244384766, 8.937915802001953, 11.071261405944824, 13.204607009887695, 15.337952613830566, 17.471298217773438, 19.604644775390625, 21.737991333007812, 23.871335983276367, 26.004682540893555, 28.13802719116211, 30.271373748779297, 32.404720306396484, 34.53806686401367, 36.671409606933594, 38.80475616455078, 40.93810272216797, 43.071449279785156, 45.204795837402344, 47.33814239501953, 49.47148895263672, 51.604835510253906, 53.738182067871094, 55.871524810791016, 58.0048713684082, 60.13821792602539, 62.27156448364258, 64.4049072265625]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 3.0, 6.0, 5.0, 7.0, 7.0, 5.0, 7.0, 12.0, 13.0, 19.0, 17.0, 18.0, 18.0, 21.0, 30.0, 29.0, 28.0, 39.0, 29.0, 51.0, 33.0, 37.0, 29.0, 30.0, 46.0, 42.0, 40.0, 36.0, 28.0, 34.0, 27.0, 45.0, 19.0, 29.0, 24.0, 21.0, 23.0, 17.0, 15.0, 10.0, 9.0, 16.0, 8.0, 5.0, 7.0, 6.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.57829284667969, -83.71070861816406, -80.84313201904297, -77.97555541992188, -75.10797119140625, -72.24038696289062, -69.37281036376953, -66.50523376464844, -63.63764953613281, -60.77006912231445, -57.902488708496094, -55.034908294677734, -52.167327880859375, -49.299747467041016, -46.432167053222656, -43.5645866394043, -40.69700622558594, -37.82942581176758, -34.96184539794922, -32.09426498413086, -29.2266845703125, -26.35910415649414, -23.49152374267578, -20.623943328857422, -17.756362915039062, -14.888782501220703, -12.021202087402344, -9.153621673583984, -6.286041259765625, -3.4184608459472656, -0.5508804321289062, 2.316699981689453, 5.184288024902344, 8.051868438720703, 10.919448852539062, 13.787029266357422, 16.65460968017578, 19.52219009399414, 22.3897705078125, 25.25735092163086, 28.12493133544922, 30.992511749267578, 33.86009216308594, 36.7276725769043, 39.595252990722656, 42.462833404541016, 45.330413818359375, 48.197994232177734, 51.065574645996094, 53.93315505981445, 56.80073547363281, 59.66831588745117, 62.53589630126953, 65.40347290039062, 68.27105712890625, 71.13864135742188, 74.00621795654297, 76.87379455566406, 79.74137878417969, 82.60896301269531, 85.4765396118164, 88.3441162109375, 91.21170043945312, 94.07928466796875, 96.94686126708984]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 1.0, 7.0, 2.0, 4.0, 8.0, 15.0, 9.0, 16.0, 22.0, 11.0, 16.0, 34.0, 28.0, 29.0, 39.0, 33.0, 34.0, 40.0, 47.0, 56.0, 47.0, 54.0, 53.0, 41.0, 48.0, 41.0, 39.0, 39.0, 31.0, 21.0, 22.0, 15.0, 15.0, 13.0, 20.0, 9.0, 8.0, 6.0, 6.0, 5.0, 6.0, 4.0, 6.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.21875, -8.94580078125, -8.6728515625, -8.39990234375, -8.126953125, -7.85400390625, -7.5810546875, -7.30810546875, -7.03515625, -6.76220703125, -6.4892578125, -6.21630859375, -5.943359375, -5.67041015625, -5.3974609375, -5.12451171875, -4.8515625, -4.57861328125, -4.3056640625, -4.03271484375, -3.759765625, -3.48681640625, -3.2138671875, -2.94091796875, -2.66796875, -2.39501953125, -2.1220703125, -1.84912109375, -1.576171875, -1.30322265625, -1.0302734375, -0.75732421875, -0.484375, -0.21142578125, 0.0615234375, 0.33447265625, 0.607421875, 0.88037109375, 1.1533203125, 1.42626953125, 1.69921875, 1.97216796875, 2.2451171875, 2.51806640625, 2.791015625, 3.06396484375, 3.3369140625, 3.60986328125, 3.8828125, 4.15576171875, 4.4287109375, 4.70166015625, 4.974609375, 5.24755859375, 5.5205078125, 5.79345703125, 6.06640625, 6.33935546875, 6.6123046875, 6.88525390625, 7.158203125, 7.43115234375, 7.7041015625, 7.97705078125, 8.25]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 6.0, 3.0, 12.0, 14.0, 13.0, 11.0, 19.0, 33.0, 47.0, 62.0, 95.0, 136.0, 200.0, 272.0, 396.0, 711.0, 1036.0, 1809.0, 3270.0, 6465.0, 15968.0, 155846.0, 2938556.0, 996271.0, 51313.0, 10378.0, 4830.0, 2582.0, 1520.0, 880.0, 536.0, 319.0, 218.0, 129.0, 95.0, 76.0, 40.0, 32.0, 30.0, 10.0, 8.0, 11.0, 10.0, 6.0, 4.0, 5.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.140625, -26.33740234375, -25.5341796875, -24.73095703125, -23.927734375, -23.12451171875, -22.3212890625, -21.51806640625, -20.71484375, -19.91162109375, -19.1083984375, -18.30517578125, -17.501953125, -16.69873046875, -15.8955078125, -15.09228515625, -14.2890625, -13.48583984375, -12.6826171875, -11.87939453125, -11.076171875, -10.27294921875, -9.4697265625, -8.66650390625, -7.86328125, -7.06005859375, -6.2568359375, -5.45361328125, -4.650390625, -3.84716796875, -3.0439453125, -2.24072265625, -1.4375, -0.63427734375, 0.1689453125, 0.97216796875, 1.775390625, 2.57861328125, 3.3818359375, 4.18505859375, 4.98828125, 5.79150390625, 6.5947265625, 7.39794921875, 8.201171875, 9.00439453125, 9.8076171875, 10.61083984375, 11.4140625, 12.21728515625, 13.0205078125, 13.82373046875, 14.626953125, 15.43017578125, 16.2333984375, 17.03662109375, 17.83984375, 18.64306640625, 19.4462890625, 20.24951171875, 21.052734375, 21.85595703125, 22.6591796875, 23.46240234375, 24.265625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 4.0, 7.0, 14.0, 7.0, 18.0, 31.0, 33.0, 43.0, 71.0, 109.0, 229.0, 532.0, 972.0, 972.0, 484.0, 200.0, 110.0, 71.0, 42.0, 26.0, 19.0, 18.0, 18.0, 9.0, 7.0, 7.0, 8.0, 7.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-28.21875, -27.27685546875, -26.3349609375, -25.39306640625, -24.451171875, -23.50927734375, -22.5673828125, -21.62548828125, -20.68359375, -19.74169921875, -18.7998046875, -17.85791015625, -16.916015625, -15.97412109375, -15.0322265625, -14.09033203125, -13.1484375, -12.20654296875, -11.2646484375, -10.32275390625, -9.380859375, -8.43896484375, -7.4970703125, -6.55517578125, -5.61328125, -4.67138671875, -3.7294921875, -2.78759765625, -1.845703125, -0.90380859375, 0.0380859375, 0.97998046875, 1.921875, 2.86376953125, 3.8056640625, 4.74755859375, 5.689453125, 6.63134765625, 7.5732421875, 8.51513671875, 9.45703125, 10.39892578125, 11.3408203125, 12.28271484375, 13.224609375, 14.16650390625, 15.1083984375, 16.05029296875, 16.9921875, 17.93408203125, 18.8759765625, 19.81787109375, 20.759765625, 21.70166015625, 22.6435546875, 23.58544921875, 24.52734375, 25.46923828125, 26.4111328125, 27.35302734375, 28.294921875, 29.23681640625, 30.1787109375, 31.12060546875, 32.0625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 6.0, 12.0, 13.0, 18.0, 31.0, 38.0, 56.0, 89.0, 158.0, 240.0, 439.0, 845.0, 1727.0, 4080.0, 10167.0, 34134.0, 247548.0, 3588725.0, 253167.0, 34632.0, 10528.0, 3981.0, 1755.0, 772.0, 449.0, 293.0, 137.0, 102.0, 49.0, 32.0, 13.0, 14.0, 7.0, 5.0, 5.0, 4.0, 8.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-41.78125, -40.5341796875, -39.287109375, -38.0400390625, -36.79296875, -35.5458984375, -34.298828125, -33.0517578125, -31.8046875, -30.5576171875, -29.310546875, -28.0634765625, -26.81640625, -25.5693359375, -24.322265625, -23.0751953125, -21.828125, -20.5810546875, -19.333984375, -18.0869140625, -16.83984375, -15.5927734375, -14.345703125, -13.0986328125, -11.8515625, -10.6044921875, -9.357421875, -8.1103515625, -6.86328125, -5.6162109375, -4.369140625, -3.1220703125, -1.875, -0.6279296875, 0.619140625, 1.8662109375, 3.11328125, 4.3603515625, 5.607421875, 6.8544921875, 8.1015625, 9.3486328125, 10.595703125, 11.8427734375, 13.08984375, 14.3369140625, 15.583984375, 16.8310546875, 18.078125, 19.3251953125, 20.572265625, 21.8193359375, 23.06640625, 24.3134765625, 25.560546875, 26.8076171875, 28.0546875, 29.3017578125, 30.548828125, 31.7958984375, 33.04296875, 34.2900390625, 35.537109375, 36.7841796875, 38.03125]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 9.0, 12.0, 9.0, 22.0, 41.0, 58.0, 88.0, 121.0, 166.0, 130.0, 108.0, 70.0, 56.0, 34.0, 19.0, 18.0, 11.0, 8.0, 3.0, 11.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-98.1707992553711, -95.26211547851562, -92.35343170166016, -89.44474792480469, -86.53606414794922, -83.62738037109375, -80.71870422363281, -77.81002044677734, -74.90133666992188, -71.9926528930664, -69.08396911621094, -66.17528533935547, -63.266605377197266, -60.3579216003418, -57.44923782348633, -54.540557861328125, -51.63187026977539, -48.72318649291992, -45.81450271606445, -42.90582275390625, -39.99713897705078, -37.08845520019531, -34.179771423339844, -31.271089553833008, -28.36240577697754, -25.45372200012207, -22.545040130615234, -19.636356353759766, -16.727672576904297, -13.818990707397461, -10.910306930541992, -8.001625061035156, -5.0929412841796875, -2.184258222579956, 0.7244248390197754, 3.633108139038086, 6.541790962219238, 9.45047378540039, 12.35915756225586, 15.267839431762695, 18.176523208618164, 21.085206985473633, 23.99388885498047, 26.902572631835938, 29.811256408691406, 32.719940185546875, 35.628623962402344, 38.53730392456055, 41.445987701416016, 44.354671478271484, 47.26335525512695, 50.172035217285156, 53.080718994140625, 55.989402770996094, 58.89808654785156, 61.80677032470703, 64.7154541015625, 67.62413787841797, 70.53282165527344, 73.4415054321289, 76.35018920898438, 79.25886535644531, 82.16755676269531, 85.07623291015625, 87.98491668701172]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 5.0, 3.0, 5.0, 3.0, 6.0, 7.0, 10.0, 5.0, 12.0, 7.0, 15.0, 14.0, 15.0, 21.0, 19.0, 30.0, 23.0, 18.0, 33.0, 31.0, 23.0, 27.0, 34.0, 42.0, 41.0, 59.0, 40.0, 34.0, 35.0, 42.0, 40.0, 34.0, 27.0, 32.0, 27.0, 28.0, 30.0, 26.0, 13.0, 15.0, 10.0, 11.0, 13.0, 7.0, 10.0, 9.0, 9.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-57.083038330078125, -55.23347091674805, -53.38390350341797, -51.53433609008789, -49.68476867675781, -47.835201263427734, -45.985633850097656, -44.13606643676758, -42.2864990234375, -40.43693161010742, -38.587364196777344, -36.737796783447266, -34.88822937011719, -33.03866195678711, -31.18909454345703, -29.339527130126953, -27.489959716796875, -25.640392303466797, -23.79082489013672, -21.94125747680664, -20.091690063476562, -18.242122650146484, -16.392555236816406, -14.542987823486328, -12.69342041015625, -10.843852996826172, -8.994285583496094, -7.144718170166016, -5.2951507568359375, -3.4455833435058594, -1.5960159301757812, 0.2535514831542969, 2.103118896484375, 3.952686309814453, 5.802253723144531, 7.651821136474609, 9.501388549804688, 11.350955963134766, 13.200523376464844, 15.050090789794922, 16.899658203125, 18.749225616455078, 20.598793029785156, 22.448360443115234, 24.297927856445312, 26.14749526977539, 27.99706268310547, 29.846630096435547, 31.696197509765625, 33.5457649230957, 35.39533233642578, 37.24489974975586, 39.09446716308594, 40.944034576416016, 42.793601989746094, 44.64316940307617, 46.49273681640625, 48.34230422973633, 50.191871643066406, 52.041439056396484, 53.89100646972656, 55.74057388305664, 57.59014129638672, 59.4397087097168, 61.289276123046875]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 4.0, 9.0, 2.0, 10.0, 11.0, 19.0, 10.0, 20.0, 19.0, 25.0, 24.0, 34.0, 41.0, 26.0, 41.0, 38.0, 45.0, 47.0, 51.0, 54.0, 61.0, 46.0, 35.0, 42.0, 35.0, 35.0, 44.0, 20.0, 24.0, 19.0, 20.0, 14.0, 12.0, 14.0, 6.0, 9.0, 4.0, 6.0, 10.0, 2.0, 5.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-9.515625, -9.24456787109375, -8.9735107421875, -8.70245361328125, -8.431396484375, -8.16033935546875, -7.8892822265625, -7.61822509765625, -7.34716796875, -7.07611083984375, -6.8050537109375, -6.53399658203125, -6.262939453125, -5.99188232421875, -5.7208251953125, -5.44976806640625, -5.1787109375, -4.90765380859375, -4.6365966796875, -4.36553955078125, -4.094482421875, -3.82342529296875, -3.5523681640625, -3.28131103515625, -3.01025390625, -2.73919677734375, -2.4681396484375, -2.19708251953125, -1.926025390625, -1.65496826171875, -1.3839111328125, -1.11285400390625, -0.841796875, -0.57073974609375, -0.2996826171875, -0.02862548828125, 0.242431640625, 0.51348876953125, 0.7845458984375, 1.05560302734375, 1.32666015625, 1.59771728515625, 1.8687744140625, 2.13983154296875, 2.410888671875, 2.68194580078125, 2.9530029296875, 3.22406005859375, 3.4951171875, 3.76617431640625, 4.0372314453125, 4.30828857421875, 4.579345703125, 4.85040283203125, 5.1214599609375, 5.39251708984375, 5.66357421875, 5.93463134765625, 6.2056884765625, 6.47674560546875, 6.747802734375, 7.01885986328125, 7.2899169921875, 7.56097412109375, 7.83203125]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 2.0, 9.0, 5.0, 6.0, 14.0, 23.0, 37.0, 53.0, 62.0, 98.0, 184.0, 288.0, 404.0, 588.0, 923.0, 1443.0, 2385.0, 3636.0, 5755.0, 9205.0, 14914.0, 24916.0, 42030.0, 72262.0, 126349.0, 231862.0, 219852.0, 119918.0, 69119.0, 39985.0, 24009.0, 14231.0, 8772.0, 5536.0, 3443.0, 2188.0, 1465.0, 862.0, 606.0, 399.0, 257.0, 146.0, 109.0, 75.0, 50.0, 24.0, 20.0, 13.0, 15.0, 7.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.2003173828125, -0.19441795349121094, -0.18851852416992188, -0.1826190948486328, -0.17671966552734375, -0.1708202362060547, -0.16492080688476562, -0.15902137756347656, -0.1531219482421875, -0.14722251892089844, -0.14132308959960938, -0.1354236602783203, -0.12952423095703125, -0.12362480163574219, -0.11772537231445312, -0.11182594299316406, -0.105926513671875, -0.10002708435058594, -0.09412765502929688, -0.08822822570800781, -0.08232879638671875, -0.07642936706542969, -0.07052993774414062, -0.06463050842285156, -0.0587310791015625, -0.05283164978027344, -0.046932220458984375, -0.04103279113769531, -0.03513336181640625, -0.029233932495117188, -0.023334503173828125, -0.017435073852539062, -0.01153564453125, -0.0056362152099609375, 0.000263214111328125, 0.0061626434326171875, 0.01206207275390625, 0.017961502075195312, 0.023860931396484375, 0.029760360717773438, 0.0356597900390625, 0.04155921936035156, 0.047458648681640625, 0.05335807800292969, 0.05925750732421875, 0.06515693664550781, 0.07105636596679688, 0.07695579528808594, 0.082855224609375, 0.08875465393066406, 0.09465408325195312, 0.10055351257324219, 0.10645294189453125, 0.11235237121582031, 0.11825180053710938, 0.12415122985839844, 0.1300506591796875, 0.13595008850097656, 0.14184951782226562, 0.1477489471435547, 0.15364837646484375, 0.1595478057861328, 0.16544723510742188, 0.17134666442871094, 0.17724609375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 6.0, 3.0, 6.0, 8.0, 10.0, 10.0, 10.0, 12.0, 11.0, 15.0, 23.0, 22.0, 20.0, 22.0, 32.0, 33.0, 35.0, 36.0, 33.0, 30.0, 45.0, 35.0, 33.0, 1061.0, 36.0, 48.0, 35.0, 38.0, 35.0, 35.0, 27.0, 31.0, 23.0, 25.0, 19.0, 26.0, 20.0, 20.0, 9.0, 5.0, 9.0, 9.0, 6.0, 4.0, 10.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.27734375, -4.13043212890625, -3.9835205078125, -3.83660888671875, -3.689697265625, -3.54278564453125, -3.3958740234375, -3.24896240234375, -3.10205078125, -2.95513916015625, -2.8082275390625, -2.66131591796875, -2.514404296875, -2.36749267578125, -2.2205810546875, -2.07366943359375, -1.9267578125, -1.77984619140625, -1.6329345703125, -1.48602294921875, -1.339111328125, -1.19219970703125, -1.0452880859375, -0.89837646484375, -0.75146484375, -0.60455322265625, -0.4576416015625, -0.31072998046875, -0.163818359375, -0.01690673828125, 0.1300048828125, 0.27691650390625, 0.423828125, 0.57073974609375, 0.7176513671875, 0.86456298828125, 1.011474609375, 1.15838623046875, 1.3052978515625, 1.45220947265625, 1.59912109375, 1.74603271484375, 1.8929443359375, 2.03985595703125, 2.186767578125, 2.33367919921875, 2.4805908203125, 2.62750244140625, 2.7744140625, 2.92132568359375, 3.0682373046875, 3.21514892578125, 3.362060546875, 3.50897216796875, 3.6558837890625, 3.80279541015625, 3.94970703125, 4.09661865234375, 4.2435302734375, 4.39044189453125, 4.537353515625, 4.68426513671875, 4.8311767578125, 4.97808837890625, 5.125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 3.0, 13.0, 18.0, 26.0, 25.0, 60.0, 78.0, 111.0, 164.0, 264.0, 365.0, 504.0, 735.0, 1056.0, 1402.0, 2032.0, 3114.0, 4511.0, 6592.0, 9780.0, 14151.0, 20706.0, 30248.0, 45080.0, 67141.0, 100897.0, 152353.0, 1234573.0, 132065.0, 87679.0, 58175.0, 38976.0, 26663.0, 18272.0, 12224.0, 8459.0, 5728.0, 4027.0, 2795.0, 1886.0, 1312.0, 866.0, 627.0, 429.0, 303.0, 210.0, 138.0, 104.0, 60.0, 50.0, 40.0, 17.0, 12.0, 5.0, 6.0, 7.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.06927490234375, -0.0670633316040039, -0.06485176086425781, -0.06264019012451172, -0.060428619384765625, -0.05821704864501953, -0.05600547790527344, -0.053793907165527344, -0.05158233642578125, -0.049370765686035156, -0.04715919494628906, -0.04494762420654297, -0.042736053466796875, -0.04052448272705078, -0.03831291198730469, -0.036101341247558594, -0.0338897705078125, -0.031678199768066406, -0.029466629028320312, -0.02725505828857422, -0.025043487548828125, -0.02283191680908203, -0.020620346069335938, -0.018408775329589844, -0.01619720458984375, -0.013985633850097656, -0.011774063110351562, -0.009562492370605469, -0.007350921630859375, -0.005139350891113281, -0.0029277801513671875, -0.0007162094116210938, 0.001495361328125, 0.0037069320678710938, 0.0059185028076171875, 0.008130073547363281, 0.010341644287109375, 0.012553215026855469, 0.014764785766601562, 0.016976356506347656, 0.01918792724609375, 0.021399497985839844, 0.023611068725585938, 0.02582263946533203, 0.028034210205078125, 0.03024578094482422, 0.03245735168457031, 0.034668922424316406, 0.0368804931640625, 0.039092063903808594, 0.04130363464355469, 0.04351520538330078, 0.045726776123046875, 0.04793834686279297, 0.05014991760253906, 0.052361488342285156, 0.05457305908203125, 0.056784629821777344, 0.05899620056152344, 0.06120777130126953, 0.06341934204101562, 0.06563091278076172, 0.06784248352050781, 0.0700540542602539, 0.072265625]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 9.0, 5.0, 9.0, 10.0, 9.0, 14.0, 24.0, 33.0, 35.0, 44.0, 40.0, 46.0, 63.0, 65.0, 56.0, 62.0, 55.0, 50.0, 51.0, 58.0, 54.0, 35.0, 31.0, 29.0, 23.0, 20.0, 17.0, 16.0, 7.0, 5.0, 6.0, 8.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00030612945556640625, -0.00029597803950309753, -0.0002858266234397888, -0.0002756752073764801, -0.0002655237913131714, -0.00025537237524986267, -0.00024522095918655396, -0.00023506954312324524, -0.00022491812705993652, -0.0002147667109966278, -0.0002046152949333191, -0.00019446387887001038, -0.00018431246280670166, -0.00017416104674339294, -0.00016400963068008423, -0.0001538582146167755, -0.0001437067985534668, -0.00013355538249015808, -0.00012340396642684937, -0.00011325255036354065, -0.00010310113430023193, -9.294971823692322e-05, -8.27983021736145e-05, -7.264688611030579e-05, -6.249547004699707e-05, -5.2344053983688354e-05, -4.219263792037964e-05, -3.204122185707092e-05, -2.1889805793762207e-05, -1.1738389730453491e-05, -1.5869736671447754e-06, 8.56444239616394e-06, 1.8715858459472656e-05, 2.8867274522781372e-05, 3.901869058609009e-05, 4.9170106649398804e-05, 5.932152271270752e-05, 6.947293877601624e-05, 7.962435483932495e-05, 8.977577090263367e-05, 9.992718696594238e-05, 0.0001100786030292511, 0.00012023001909255981, 0.00013038143515586853, 0.00014053285121917725, 0.00015068426728248596, 0.00016083568334579468, 0.0001709870994091034, 0.0001811385154724121, 0.00019128993153572083, 0.00020144134759902954, 0.00021159276366233826, 0.00022174417972564697, 0.0002318955957889557, 0.0002420470118522644, 0.0002521984279155731, 0.00026234984397888184, 0.00027250126004219055, 0.00028265267610549927, 0.000292804092168808, 0.0003029555082321167, 0.0003131069242954254, 0.00032325834035873413, 0.00033340975642204285, 0.00034356117248535156]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 5.0, 4.0, 8.0, 8.0, 13.0, 15.0, 30.0, 41.0, 53.0, 66.0, 80.0, 137.0, 179.0, 239.0, 325.0, 660.0, 6876.0, 1008033.0, 29512.0, 853.0, 404.0, 260.0, 190.0, 162.0, 105.0, 90.0, 64.0, 33.0, 32.0, 22.0, 19.0, 11.0, 10.0, 6.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00583648681640625, -0.005662977695465088, -0.005489468574523926, -0.005315959453582764, -0.0051424503326416016, -0.0049689412117004395, -0.004795432090759277, -0.004621922969818115, -0.004448413848876953, -0.004274904727935791, -0.004101395606994629, -0.003927886486053467, -0.0037543773651123047, -0.0035808682441711426, -0.0034073591232299805, -0.0032338500022888184, -0.0030603408813476562, -0.002886831760406494, -0.002713322639465332, -0.00253981351852417, -0.002366304397583008, -0.0021927952766418457, -0.0020192861557006836, -0.0018457770347595215, -0.0016722679138183594, -0.0014987587928771973, -0.0013252496719360352, -0.001151740550994873, -0.000978231430053711, -0.0008047223091125488, -0.0006312131881713867, -0.0004577040672302246, -0.0002841949462890625, -0.00011068582534790039, 6.282329559326172e-05, 0.00023633241653442383, 0.00040984153747558594, 0.000583350658416748, 0.0007568597793579102, 0.0009303689002990723, 0.0011038780212402344, 0.0012773871421813965, 0.0014508962631225586, 0.0016244053840637207, 0.0017979145050048828, 0.001971423625946045, 0.002144932746887207, 0.002318441867828369, 0.0024919509887695312, 0.0026654601097106934, 0.0028389692306518555, 0.0030124783515930176, 0.0031859874725341797, 0.003359496593475342, 0.003533005714416504, 0.003706514835357666, 0.003880023956298828, 0.00405353307723999, 0.004227042198181152, 0.0044005513191223145, 0.0045740604400634766, 0.004747569561004639, 0.004921078681945801, 0.005094587802886963, 0.005268096923828125]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 24.0, 515.0, 450.0, 22.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0032828235998749733, -0.0032251852098852396, -0.003167546819895506, -0.0031099081970751286, -0.003052269807085395, -0.002994631417095661, -0.0029369930271059275, -0.0028793546371161938, -0.00282171624712646, -0.0027640778571367264, -0.0027064394671469927, -0.002648801077157259, -0.0025911624543368816, -0.002533524064347148, -0.0024758856743574142, -0.0024182472843676805, -0.002360608661547303, -0.0023029702715575695, -0.002245331881567836, -0.002187693491578102, -0.0021300548687577248, -0.002072416478767991, -0.0020147780887782574, -0.0019571396987885237, -0.00189950130879879, -0.0018418629188090563, -0.0017842244124040008, -0.001726586022414267, -0.0016689476324245334, -0.0016113091260194778, -0.0015536707360297441, -0.0014960323460400105, -0.0014383939560502768, -0.001380755566060543, -0.0013231170596554875, -0.0012654786696657538, -0.0012078402796760201, -0.0011502017732709646, -0.001092563383281231, -0.0010349249932914972, -0.0009772864868864417, -0.0009196480386890471, -0.0008620096486993134, -0.0008043712005019188, -0.0007467327523045242, -0.0006890943041071296, -0.0006314559141173959, -0.0005738174659200013, -0.0005161790177226067, -0.0004585405986290425, -0.0004009021504316479, -0.00034326373133808374, -0.00028562528314068913, -0.00022798686404712498, -0.00017034844495356083, -0.00011270999675616622, -5.507157766260207e-05, 2.566852344898507e-06, 6.020528235239908e-05, 0.00011784370872192085, 0.00017548214236740023, 0.0002331205760128796, 0.00029075899510644376, 0.00034839744330383837, 0.0004060358623974025]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 4.0, 6.0, 6.0, 9.0, 10.0, 10.0, 24.0, 20.0, 20.0, 23.0, 30.0, 31.0, 33.0, 27.0, 49.0, 46.0, 41.0, 59.0, 48.0, 40.0, 48.0, 42.0, 41.0, 44.0, 32.0, 38.0, 27.0, 32.0, 26.0, 31.0, 21.0, 16.0, 14.0, 12.0, 15.0, 10.0, 5.0, 6.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0002675056457519531, -0.0002597291022539139, -0.00025195255875587463, -0.0002441760152578354, -0.00023639947175979614, -0.0002286229282617569, -0.00022084638476371765, -0.0002130698412656784, -0.00020529329776763916, -0.00019751675426959991, -0.00018974021077156067, -0.00018196366727352142, -0.00017418712377548218, -0.00016641058027744293, -0.0001586340367794037, -0.00015085749328136444, -0.0001430809497833252, -0.00013530440628528595, -0.0001275278627872467, -0.00011975131928920746, -0.00011197477579116821, -0.00010419823229312897, -9.642168879508972e-05, -8.864514529705048e-05, -8.086860179901123e-05, -7.309205830097198e-05, -6.531551480293274e-05, -5.7538971304893494e-05, -4.976242780685425e-05, -4.1985884308815e-05, -3.420934081077576e-05, -2.643279731273651e-05, -1.8656253814697266e-05, -1.087971031665802e-05, -3.1031668186187744e-06, 4.673376679420471e-06, 1.2449920177459717e-05, 2.0226463675498962e-05, 2.8003007173538208e-05, 3.5779550671577454e-05, 4.35560941696167e-05, 5.1332637667655945e-05, 5.910918116569519e-05, 6.688572466373444e-05, 7.466226816177368e-05, 8.243881165981293e-05, 9.021535515785217e-05, 9.799189865589142e-05, 0.00010576844215393066, 0.00011354498565196991, 0.00012132152915000916, 0.0001290980726480484, 0.00013687461614608765, 0.0001446511596441269, 0.00015242770314216614, 0.00016020424664020538, 0.00016798079013824463, 0.00017575733363628387, 0.00018353387713432312, 0.00019131042063236237, 0.0001990869641304016, 0.00020686350762844086, 0.0002146400511264801, 0.00022241659462451935, 0.0002301931381225586]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 4.0, 9.0, 2.0, 10.0, 11.0, 19.0, 10.0, 20.0, 19.0, 25.0, 24.0, 34.0, 41.0, 26.0, 41.0, 38.0, 45.0, 47.0, 51.0, 54.0, 61.0, 46.0, 35.0, 42.0, 35.0, 35.0, 44.0, 20.0, 24.0, 19.0, 20.0, 14.0, 12.0, 14.0, 6.0, 9.0, 4.0, 6.0, 10.0, 2.0, 5.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-9.515625, -9.24456787109375, -8.9735107421875, -8.70245361328125, -8.431396484375, -8.16033935546875, -7.8892822265625, -7.61822509765625, -7.34716796875, -7.07611083984375, -6.8050537109375, -6.53399658203125, -6.262939453125, -5.99188232421875, -5.7208251953125, -5.44976806640625, -5.1787109375, -4.90765380859375, -4.6365966796875, -4.36553955078125, -4.094482421875, -3.82342529296875, -3.5523681640625, -3.28131103515625, -3.01025390625, -2.73919677734375, -2.4681396484375, -2.19708251953125, -1.926025390625, -1.65496826171875, -1.3839111328125, -1.11285400390625, -0.841796875, -0.57073974609375, -0.2996826171875, -0.02862548828125, 0.242431640625, 0.51348876953125, 0.7845458984375, 1.05560302734375, 1.32666015625, 1.59771728515625, 1.8687744140625, 2.13983154296875, 2.410888671875, 2.68194580078125, 2.9530029296875, 3.22406005859375, 3.4951171875, 3.76617431640625, 4.0372314453125, 4.30828857421875, 4.579345703125, 4.85040283203125, 5.1214599609375, 5.39251708984375, 5.66357421875, 5.93463134765625, 6.2056884765625, 6.47674560546875, 6.747802734375, 7.01885986328125, 7.2899169921875, 7.56097412109375, 7.83203125]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 1.0, 5.0, 11.0, 12.0, 6.0, 23.0, 18.0, 25.0, 27.0, 39.0, 51.0, 67.0, 114.0, 170.0, 277.0, 453.0, 729.0, 1187.0, 2020.0, 3901.0, 8089.0, 22896.0, 163588.0, 771201.0, 48504.0, 12944.0, 5415.0, 2725.0, 1526.0, 908.0, 564.0, 344.0, 219.0, 153.0, 101.0, 71.0, 45.0, 38.0, 23.0, 10.0, 12.0, 8.0, 8.0, 5.0, 4.0, 4.0, 4.0, 2.0, 4.0, 4.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-25.96875, -25.080810546875, -24.19287109375, -23.304931640625, -22.4169921875, -21.529052734375, -20.64111328125, -19.753173828125, -18.865234375, -17.977294921875, -17.08935546875, -16.201416015625, -15.3134765625, -14.425537109375, -13.53759765625, -12.649658203125, -11.76171875, -10.873779296875, -9.98583984375, -9.097900390625, -8.2099609375, -7.322021484375, -6.43408203125, -5.546142578125, -4.658203125, -3.770263671875, -2.88232421875, -1.994384765625, -1.1064453125, -0.218505859375, 0.66943359375, 1.557373046875, 2.4453125, 3.333251953125, 4.22119140625, 5.109130859375, 5.9970703125, 6.885009765625, 7.77294921875, 8.660888671875, 9.548828125, 10.436767578125, 11.32470703125, 12.212646484375, 13.1005859375, 13.988525390625, 14.87646484375, 15.764404296875, 16.65234375, 17.540283203125, 18.42822265625, 19.316162109375, 20.2041015625, 21.092041015625, 21.97998046875, 22.867919921875, 23.755859375, 24.643798828125, 25.53173828125, 26.419677734375, 27.3076171875, 28.195556640625, 29.08349609375, 29.971435546875, 30.859375]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 8.0, 7.0, 11.0, 13.0, 15.0, 19.0, 21.0, 28.0, 33.0, 38.0, 44.0, 38.0, 34.0, 54.0, 86.0, 147.0, 1565.0, 315.0, 114.0, 68.0, 53.0, 32.0, 45.0, 28.0, 35.0, 36.0, 27.0, 18.0, 23.0, 22.0, 12.0, 6.0, 16.0, 7.0, 6.0, 6.0, 3.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-28.5625, -27.63525390625, -26.7080078125, -25.78076171875, -24.853515625, -23.92626953125, -22.9990234375, -22.07177734375, -21.14453125, -20.21728515625, -19.2900390625, -18.36279296875, -17.435546875, -16.50830078125, -15.5810546875, -14.65380859375, -13.7265625, -12.79931640625, -11.8720703125, -10.94482421875, -10.017578125, -9.09033203125, -8.1630859375, -7.23583984375, -6.30859375, -5.38134765625, -4.4541015625, -3.52685546875, -2.599609375, -1.67236328125, -0.7451171875, 0.18212890625, 1.109375, 2.03662109375, 2.9638671875, 3.89111328125, 4.818359375, 5.74560546875, 6.6728515625, 7.60009765625, 8.52734375, 9.45458984375, 10.3818359375, 11.30908203125, 12.236328125, 13.16357421875, 14.0908203125, 15.01806640625, 15.9453125, 16.87255859375, 17.7998046875, 18.72705078125, 19.654296875, 20.58154296875, 21.5087890625, 22.43603515625, 23.36328125, 24.29052734375, 25.2177734375, 26.14501953125, 27.072265625, 27.99951171875, 28.9267578125, 29.85400390625, 30.78125]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 6.0, 7.0, 4.0, 11.0, 5.0, 11.0, 18.0, 30.0, 32.0, 38.0, 58.0, 85.0, 129.0, 235.0, 521.0, 1173.0, 3109.0, 10721.0, 75919.0, 2939636.0, 96013.0, 12091.0, 3410.0, 1270.0, 506.0, 249.0, 133.0, 77.0, 61.0, 45.0, 27.0, 19.0, 13.0, 17.0, 11.0, 5.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-49.53125, -48.09716796875, -46.6630859375, -45.22900390625, -43.794921875, -42.36083984375, -40.9267578125, -39.49267578125, -38.05859375, -36.62451171875, -35.1904296875, -33.75634765625, -32.322265625, -30.88818359375, -29.4541015625, -28.02001953125, -26.5859375, -25.15185546875, -23.7177734375, -22.28369140625, -20.849609375, -19.41552734375, -17.9814453125, -16.54736328125, -15.11328125, -13.67919921875, -12.2451171875, -10.81103515625, -9.376953125, -7.94287109375, -6.5087890625, -5.07470703125, -3.640625, -2.20654296875, -0.7724609375, 0.66162109375, 2.095703125, 3.52978515625, 4.9638671875, 6.39794921875, 7.83203125, 9.26611328125, 10.7001953125, 12.13427734375, 13.568359375, 15.00244140625, 16.4365234375, 17.87060546875, 19.3046875, 20.73876953125, 22.1728515625, 23.60693359375, 25.041015625, 26.47509765625, 27.9091796875, 29.34326171875, 30.77734375, 32.21142578125, 33.6455078125, 35.07958984375, 36.513671875, 37.94775390625, 39.3818359375, 40.81591796875, 42.25]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [3.0, 25.0, 153.0, 563.0, 222.0, 39.0, 10.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.226104736328125, -21.176929473876953, -13.127754211425781, -5.078578948974609, 2.9705963134765625, 11.019771575927734, 19.068946838378906, 27.118122100830078, 35.16729736328125, 43.21647262573242, 51.265647888183594, 59.314823150634766, 67.36399841308594, 75.41317749023438, 83.46234893798828, 91.51152038574219, 99.56069946289062, 107.60987854003906, 115.65904998779297, 123.70822143554688, 131.7574005126953, 139.80657958984375, 147.85574340820312, 155.90492248535156, 163.9541015625, 172.00328063964844, 180.05245971679688, 188.10162353515625, 196.1508026123047, 204.19998168945312, 212.2491455078125, 220.29832458496094, 228.3475341796875, 236.39671325683594, 244.44589233398438, 252.49505615234375, 260.54425048828125, 268.5934143066406, 276.642578125, 284.6917724609375, 292.7409362792969, 300.79010009765625, 308.83929443359375, 316.8884582519531, 324.9376220703125, 332.98681640625, 341.0359802246094, 349.0851745605469, 357.13433837890625, 365.1835021972656, 373.2326965332031, 381.2818603515625, 389.3310546875, 397.3802185058594, 405.42938232421875, 413.47857666015625, 421.5277404785156, 429.576904296875, 437.6260986328125, 445.6752624511719, 453.72442626953125, 461.77362060546875, 469.8227844238281, 477.8719787597656, 485.921142578125]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 4.0, 4.0, 4.0, 4.0, 9.0, 16.0, 7.0, 17.0, 14.0, 20.0, 29.0, 26.0, 28.0, 27.0, 22.0, 40.0, 33.0, 33.0, 43.0, 35.0, 41.0, 43.0, 44.0, 50.0, 40.0, 40.0, 37.0, 36.0, 37.0, 34.0, 36.0, 33.0, 12.0, 17.0, 13.0, 14.0, 11.0, 16.0, 4.0, 11.0, 5.0, 3.0, 6.0, 2.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-90.70098876953125, -87.95838928222656, -85.21578979492188, -82.47319030761719, -79.7305908203125, -76.98799133300781, -74.24539184570312, -71.5027847290039, -68.76018524169922, -66.01758575439453, -63.274986267089844, -60.532386779785156, -57.7897834777832, -55.047183990478516, -52.30458450317383, -49.561981201171875, -46.81938552856445, -44.076786041259766, -41.33418655395508, -38.591583251953125, -35.84898376464844, -33.10638427734375, -30.363784790039062, -27.621183395385742, -24.878583908081055, -22.135984420776367, -19.393383026123047, -16.65078353881836, -13.908183097839355, -11.165582656860352, -8.422983169555664, -5.680381774902344, -2.9377822875976562, -0.19518208503723145, 2.5474181175231934, 5.290018081665039, 8.032618522644043, 10.775218963623047, 13.517818450927734, 16.260419845581055, 19.003019332885742, 21.74561882019043, 24.48822021484375, 27.230819702148438, 29.973419189453125, 32.71601867675781, 35.4586181640625, 38.20122146606445, 40.94382095336914, 43.68642044067383, 46.429019927978516, 49.17162322998047, 51.914222717285156, 54.656822204589844, 57.39942169189453, 60.14202117919922, 62.884620666503906, 65.6272201538086, 68.36981964111328, 71.11241912841797, 73.85501861572266, 76.59762573242188, 79.34022521972656, 82.08282470703125, 84.82542419433594]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 3.0, 4.0, 4.0, 6.0, 13.0, 11.0, 13.0, 14.0, 33.0, 19.0, 19.0, 30.0, 31.0, 36.0, 46.0, 32.0, 47.0, 39.0, 43.0, 56.0, 55.0, 42.0, 48.0, 45.0, 36.0, 39.0, 35.0, 29.0, 29.0, 23.0, 18.0, 15.0, 20.0, 8.0, 12.0, 8.0, 6.0, 3.0, 12.0, 4.0, 3.0, 5.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-9.9921875, -9.7122802734375, -9.432373046875, -9.1524658203125, -8.87255859375, -8.5926513671875, -8.312744140625, -8.0328369140625, -7.7529296875, -7.4730224609375, -7.193115234375, -6.9132080078125, -6.63330078125, -6.3533935546875, -6.073486328125, -5.7935791015625, -5.513671875, -5.2337646484375, -4.953857421875, -4.6739501953125, -4.39404296875, -4.1141357421875, -3.834228515625, -3.5543212890625, -3.2744140625, -2.9945068359375, -2.714599609375, -2.4346923828125, -2.15478515625, -1.8748779296875, -1.594970703125, -1.3150634765625, -1.03515625, -0.7552490234375, -0.475341796875, -0.1954345703125, 0.08447265625, 0.3643798828125, 0.644287109375, 0.9241943359375, 1.2041015625, 1.4840087890625, 1.763916015625, 2.0438232421875, 2.32373046875, 2.6036376953125, 2.883544921875, 3.1634521484375, 3.443359375, 3.7232666015625, 4.003173828125, 4.2830810546875, 4.56298828125, 4.8428955078125, 5.122802734375, 5.4027099609375, 5.6826171875, 5.9625244140625, 6.242431640625, 6.5223388671875, 6.80224609375, 7.0821533203125, 7.362060546875, 7.6419677734375, 7.921875]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 4.0, 7.0, 6.0, 8.0, 15.0, 17.0, 27.0, 30.0, 62.0, 69.0, 80.0, 126.0, 168.0, 243.0, 354.0, 519.0, 825.0, 1268.0, 2129.0, 3388.0, 6329.0, 13207.0, 46986.0, 471690.0, 2929203.0, 622923.0, 62956.0, 14921.0, 7000.0, 3668.0, 2220.0, 1325.0, 771.0, 582.0, 384.0, 243.0, 172.0, 108.0, 75.0, 65.0, 32.0, 25.0, 15.0, 15.0, 9.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 3.0], "bins": [-23.328125, -22.68994140625, -22.0517578125, -21.41357421875, -20.775390625, -20.13720703125, -19.4990234375, -18.86083984375, -18.22265625, -17.58447265625, -16.9462890625, -16.30810546875, -15.669921875, -15.03173828125, -14.3935546875, -13.75537109375, -13.1171875, -12.47900390625, -11.8408203125, -11.20263671875, -10.564453125, -9.92626953125, -9.2880859375, -8.64990234375, -8.01171875, -7.37353515625, -6.7353515625, -6.09716796875, -5.458984375, -4.82080078125, -4.1826171875, -3.54443359375, -2.90625, -2.26806640625, -1.6298828125, -0.99169921875, -0.353515625, 0.28466796875, 0.9228515625, 1.56103515625, 2.19921875, 2.83740234375, 3.4755859375, 4.11376953125, 4.751953125, 5.39013671875, 6.0283203125, 6.66650390625, 7.3046875, 7.94287109375, 8.5810546875, 9.21923828125, 9.857421875, 10.49560546875, 11.1337890625, 11.77197265625, 12.41015625, 13.04833984375, 13.6865234375, 14.32470703125, 14.962890625, 15.60107421875, 16.2392578125, 16.87744140625, 17.515625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 1.0, 5.0, 4.0, 5.0, 4.0, 8.0, 6.0, 12.0, 21.0, 19.0, 26.0, 38.0, 44.0, 61.0, 97.0, 172.0, 361.0, 688.0, 888.0, 653.0, 394.0, 191.0, 113.0, 57.0, 39.0, 39.0, 21.0, 28.0, 13.0, 11.0, 12.0, 8.0, 10.0, 5.0, 2.0, 8.0, 2.0, 5.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-26.046875, -25.270263671875, -24.49365234375, -23.717041015625, -22.9404296875, -22.163818359375, -21.38720703125, -20.610595703125, -19.833984375, -19.057373046875, -18.28076171875, -17.504150390625, -16.7275390625, -15.950927734375, -15.17431640625, -14.397705078125, -13.62109375, -12.844482421875, -12.06787109375, -11.291259765625, -10.5146484375, -9.738037109375, -8.96142578125, -8.184814453125, -7.408203125, -6.631591796875, -5.85498046875, -5.078369140625, -4.3017578125, -3.525146484375, -2.74853515625, -1.971923828125, -1.1953125, -0.418701171875, 0.35791015625, 1.134521484375, 1.9111328125, 2.687744140625, 3.46435546875, 4.240966796875, 5.017578125, 5.794189453125, 6.57080078125, 7.347412109375, 8.1240234375, 8.900634765625, 9.67724609375, 10.453857421875, 11.23046875, 12.007080078125, 12.78369140625, 13.560302734375, 14.3369140625, 15.113525390625, 15.89013671875, 16.666748046875, 17.443359375, 18.219970703125, 18.99658203125, 19.773193359375, 20.5498046875, 21.326416015625, 22.10302734375, 22.879638671875, 23.65625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 4.0, 5.0, 9.0, 8.0, 27.0, 23.0, 35.0, 56.0, 67.0, 121.0, 164.0, 235.0, 450.0, 669.0, 1146.0, 1891.0, 3316.0, 6232.0, 12220.0, 27491.0, 79096.0, 563008.0, 3055936.0, 333827.0, 61755.0, 23047.0, 10693.0, 5328.0, 2979.0, 1704.0, 968.0, 596.0, 421.0, 259.0, 182.0, 96.0, 68.0, 48.0, 26.0, 22.0, 18.0, 13.0, 13.0, 5.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.484375, -23.678955078125, -22.87353515625, -22.068115234375, -21.2626953125, -20.457275390625, -19.65185546875, -18.846435546875, -18.041015625, -17.235595703125, -16.43017578125, -15.624755859375, -14.8193359375, -14.013916015625, -13.20849609375, -12.403076171875, -11.59765625, -10.792236328125, -9.98681640625, -9.181396484375, -8.3759765625, -7.570556640625, -6.76513671875, -5.959716796875, -5.154296875, -4.348876953125, -3.54345703125, -2.738037109375, -1.9326171875, -1.127197265625, -0.32177734375, 0.483642578125, 1.2890625, 2.094482421875, 2.89990234375, 3.705322265625, 4.5107421875, 5.316162109375, 6.12158203125, 6.927001953125, 7.732421875, 8.537841796875, 9.34326171875, 10.148681640625, 10.9541015625, 11.759521484375, 12.56494140625, 13.370361328125, 14.17578125, 14.981201171875, 15.78662109375, 16.592041015625, 17.3974609375, 18.202880859375, 19.00830078125, 19.813720703125, 20.619140625, 21.424560546875, 22.22998046875, 23.035400390625, 23.8408203125, 24.646240234375, 25.45166015625, 26.257080078125, 27.0625]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 7.0, 35.0, 91.0, 262.0, 384.0, 162.0, 47.0, 16.0, 3.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.69752502441406, -81.86127471923828, -73.02503204345703, -64.18878173828125, -55.352535247802734, -46.51628875732422, -37.68003845214844, -28.843791961669922, -20.007545471191406, -11.171298027038574, -2.335050582885742, 6.501197814941406, 15.337444305419922, 24.173690795898438, 33.00994110107422, 41.846187591552734, 50.68243408203125, 59.518680572509766, 68.35492706298828, 77.19117736816406, 86.02742004394531, 94.8636703491211, 103.69992065429688, 112.53616333007812, 121.3724136352539, 130.2086639404297, 139.04490661621094, 147.88116455078125, 156.7174072265625, 165.55364990234375, 174.389892578125, 183.2261505126953, 192.06240844726562, 200.89865112304688, 209.7349090576172, 218.57115173339844, 227.4073944091797, 236.24365234375, 245.07989501953125, 253.9161376953125, 262.75238037109375, 271.588623046875, 280.42486572265625, 289.2611083984375, 298.0973815917969, 306.9336242675781, 315.7698669433594, 324.6061096191406, 333.4423828125, 342.27862548828125, 351.1148681640625, 359.95111083984375, 368.7873840332031, 377.6236267089844, 386.4598693847656, 395.2961120605469, 404.1323547363281, 412.9685974121094, 421.8048400878906, 430.64111328125, 439.47735595703125, 448.3135986328125, 457.14984130859375, 465.986083984375, 474.82232666015625]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 6.0, 5.0, 7.0, 5.0, 7.0, 8.0, 14.0, 11.0, 21.0, 20.0, 16.0, 22.0, 28.0, 28.0, 30.0, 33.0, 44.0, 39.0, 36.0, 40.0, 44.0, 35.0, 41.0, 33.0, 46.0, 37.0, 33.0, 41.0, 28.0, 34.0, 25.0, 34.0, 23.0, 23.0, 25.0, 18.0, 7.0, 11.0, 5.0, 13.0, 7.0, 9.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-68.72080993652344, -66.65535736083984, -64.58990478515625, -62.52445983886719, -60.459007263183594, -58.3935546875, -56.32810592651367, -54.262657165527344, -52.19720458984375, -50.131752014160156, -48.06630325317383, -46.0008544921875, -43.935401916503906, -41.86994934082031, -39.804500579833984, -37.739051818847656, -35.67359924316406, -33.60814666748047, -31.54269790649414, -29.47724723815918, -27.41179656982422, -25.346345901489258, -23.280895233154297, -21.215444564819336, -19.149993896484375, -17.084543228149414, -15.019092559814453, -12.953641891479492, -10.888191223144531, -8.82274055480957, -6.757289886474609, -4.691839218139648, -2.6263885498046875, -0.5609378814697266, 1.5045127868652344, 3.5699634552001953, 5.635414123535156, 7.700864791870117, 9.766315460205078, 11.831766128540039, 13.897216796875, 15.962667465209961, 18.028118133544922, 20.093568801879883, 22.159019470214844, 24.224470138549805, 26.289920806884766, 28.355371475219727, 30.420822143554688, 32.48627471923828, 34.55172348022461, 36.61717224121094, 38.68262481689453, 40.748077392578125, 42.81352615356445, 44.87897491455078, 46.944427490234375, 49.00988006591797, 51.0753288269043, 53.140777587890625, 55.20623016357422, 57.27168273925781, 59.33713150024414, 61.40258026123047, 63.46803283691406]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 8.0, 5.0, 6.0, 10.0, 17.0, 11.0, 9.0, 16.0, 21.0, 20.0, 30.0, 29.0, 35.0, 39.0, 33.0, 41.0, 39.0, 55.0, 34.0, 38.0, 43.0, 49.0, 48.0, 46.0, 32.0, 36.0, 34.0, 25.0, 32.0, 28.0, 24.0, 19.0, 10.0, 16.0, 7.0, 11.0, 12.0, 6.0, 9.0, 3.0, 5.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0], "bins": [-9.5546875, -9.28680419921875, -9.0189208984375, -8.75103759765625, -8.483154296875, -8.21527099609375, -7.9473876953125, -7.67950439453125, -7.41162109375, -7.14373779296875, -6.8758544921875, -6.60797119140625, -6.340087890625, -6.07220458984375, -5.8043212890625, -5.53643798828125, -5.2685546875, -5.00067138671875, -4.7327880859375, -4.46490478515625, -4.197021484375, -3.92913818359375, -3.6612548828125, -3.39337158203125, -3.12548828125, -2.85760498046875, -2.5897216796875, -2.32183837890625, -2.053955078125, -1.78607177734375, -1.5181884765625, -1.25030517578125, -0.982421875, -0.71453857421875, -0.4466552734375, -0.17877197265625, 0.089111328125, 0.35699462890625, 0.6248779296875, 0.89276123046875, 1.16064453125, 1.42852783203125, 1.6964111328125, 1.96429443359375, 2.232177734375, 2.50006103515625, 2.7679443359375, 3.03582763671875, 3.3037109375, 3.57159423828125, 3.8394775390625, 4.10736083984375, 4.375244140625, 4.64312744140625, 4.9110107421875, 5.17889404296875, 5.44677734375, 5.71466064453125, 5.9825439453125, 6.25042724609375, 6.518310546875, 6.78619384765625, 7.0540771484375, 7.32196044921875, 7.58984375]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 4.0, 1.0, 6.0, 7.0, 6.0, 11.0, 21.0, 25.0, 47.0, 53.0, 105.0, 137.0, 198.0, 228.0, 347.0, 453.0, 694.0, 941.0, 1414.0, 2069.0, 3031.0, 4375.0, 6617.0, 9942.0, 15281.0, 23662.0, 37226.0, 59597.0, 96489.0, 158861.0, 222728.0, 151581.0, 92177.0, 56968.0, 35597.0, 22982.0, 14834.0, 9638.0, 6352.0, 4185.0, 2967.0, 2014.0, 1423.0, 1015.0, 695.0, 458.0, 341.0, 241.0, 164.0, 117.0, 65.0, 59.0, 33.0, 27.0, 17.0, 14.0, 9.0, 8.0, 7.0, 2.0, 2.0], "bins": [-0.1878662109375, -0.1822509765625, -0.1766357421875, -0.1710205078125, -0.1654052734375, -0.1597900390625, -0.1541748046875, -0.1485595703125, -0.1429443359375, -0.1373291015625, -0.1317138671875, -0.1260986328125, -0.1204833984375, -0.1148681640625, -0.1092529296875, -0.1036376953125, -0.0980224609375, -0.0924072265625, -0.0867919921875, -0.0811767578125, -0.0755615234375, -0.0699462890625, -0.0643310546875, -0.0587158203125, -0.0531005859375, -0.0474853515625, -0.0418701171875, -0.0362548828125, -0.0306396484375, -0.0250244140625, -0.0194091796875, -0.0137939453125, -0.0081787109375, -0.0025634765625, 0.0030517578125, 0.0086669921875, 0.0142822265625, 0.0198974609375, 0.0255126953125, 0.0311279296875, 0.0367431640625, 0.0423583984375, 0.0479736328125, 0.0535888671875, 0.0592041015625, 0.0648193359375, 0.0704345703125, 0.0760498046875, 0.0816650390625, 0.0872802734375, 0.0928955078125, 0.0985107421875, 0.1041259765625, 0.1097412109375, 0.1153564453125, 0.1209716796875, 0.1265869140625, 0.1322021484375, 0.1378173828125, 0.1434326171875, 0.1490478515625, 0.1546630859375, 0.1602783203125, 0.1658935546875, 0.1715087890625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 3.0, 8.0, 9.0, 10.0, 11.0, 10.0, 16.0, 12.0, 14.0, 24.0, 17.0, 28.0, 28.0, 36.0, 27.0, 30.0, 31.0, 31.0, 31.0, 35.0, 35.0, 1070.0, 39.0, 27.0, 44.0, 28.0, 46.0, 42.0, 26.0, 31.0, 26.0, 29.0, 19.0, 16.0, 25.0, 14.0, 10.0, 17.0, 11.0, 14.0, 4.0, 14.0, 8.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0], "bins": [-5.1953125, -5.03619384765625, -4.8770751953125, -4.71795654296875, -4.558837890625, -4.39971923828125, -4.2406005859375, -4.08148193359375, -3.92236328125, -3.76324462890625, -3.6041259765625, -3.44500732421875, -3.285888671875, -3.12677001953125, -2.9676513671875, -2.80853271484375, -2.6494140625, -2.49029541015625, -2.3311767578125, -2.17205810546875, -2.012939453125, -1.85382080078125, -1.6947021484375, -1.53558349609375, -1.37646484375, -1.21734619140625, -1.0582275390625, -0.89910888671875, -0.739990234375, -0.58087158203125, -0.4217529296875, -0.26263427734375, -0.103515625, 0.05560302734375, 0.2147216796875, 0.37384033203125, 0.532958984375, 0.69207763671875, 0.8511962890625, 1.01031494140625, 1.16943359375, 1.32855224609375, 1.4876708984375, 1.64678955078125, 1.805908203125, 1.96502685546875, 2.1241455078125, 2.28326416015625, 2.4423828125, 2.60150146484375, 2.7606201171875, 2.91973876953125, 3.078857421875, 3.23797607421875, 3.3970947265625, 3.55621337890625, 3.71533203125, 3.87445068359375, 4.0335693359375, 4.19268798828125, 4.351806640625, 4.51092529296875, 4.6700439453125, 4.82916259765625, 4.98828125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 7.0, 9.0, 13.0, 9.0, 25.0, 38.0, 44.0, 83.0, 102.0, 144.0, 184.0, 316.0, 453.0, 682.0, 929.0, 1320.0, 1859.0, 2735.0, 4058.0, 5818.0, 8463.0, 12004.0, 17327.0, 24558.0, 35361.0, 50418.0, 72972.0, 107421.0, 165542.0, 1205452.0, 117356.0, 79724.0, 55293.0, 38362.0, 26893.0, 18773.0, 12894.0, 8941.0, 6372.0, 4322.0, 3013.0, 2126.0, 1457.0, 977.0, 686.0, 489.0, 362.0, 253.0, 153.0, 114.0, 80.0, 55.0, 37.0, 23.0, 11.0, 13.0, 7.0, 6.0, 6.0, 2.0, 1.0], "bins": [-0.07403564453125, -0.0717306137084961, -0.06942558288574219, -0.06712055206298828, -0.06481552124023438, -0.06251049041748047, -0.06020545959472656, -0.057900428771972656, -0.05559539794921875, -0.053290367126464844, -0.05098533630371094, -0.04868030548095703, -0.046375274658203125, -0.04407024383544922, -0.04176521301269531, -0.039460182189941406, -0.0371551513671875, -0.034850120544433594, -0.03254508972167969, -0.03024005889892578, -0.027935028076171875, -0.02562999725341797, -0.023324966430664062, -0.021019935607910156, -0.01871490478515625, -0.016409873962402344, -0.014104843139648438, -0.011799812316894531, -0.009494781494140625, -0.007189750671386719, -0.0048847198486328125, -0.0025796890258789062, -0.000274658203125, 0.0020303726196289062, 0.0043354034423828125, 0.006640434265136719, 0.008945465087890625, 0.011250495910644531, 0.013555526733398438, 0.015860557556152344, 0.01816558837890625, 0.020470619201660156, 0.022775650024414062, 0.02508068084716797, 0.027385711669921875, 0.02969074249267578, 0.03199577331542969, 0.034300804138183594, 0.0366058349609375, 0.038910865783691406, 0.04121589660644531, 0.04352092742919922, 0.045825958251953125, 0.04813098907470703, 0.05043601989746094, 0.052741050720214844, 0.05504608154296875, 0.057351112365722656, 0.05965614318847656, 0.06196117401123047, 0.06426620483398438, 0.06657123565673828, 0.06887626647949219, 0.0711812973022461, 0.073486328125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 2.0, 3.0, 15.0, 14.0, 15.0, 16.0, 21.0, 23.0, 21.0, 36.0, 47.0, 50.0, 57.0, 60.0, 68.0, 62.0, 59.0, 59.0, 58.0, 52.0, 47.0, 43.0, 36.0, 20.0, 20.0, 19.0, 14.0, 15.0, 10.0, 6.0, 8.0, 4.0, 10.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0008215904235839844, -0.0007985308766365051, -0.0007754713296890259, -0.0007524117827415466, -0.0007293522357940674, -0.0007062926888465881, -0.0006832331418991089, -0.0006601735949516296, -0.0006371140480041504, -0.0006140545010566711, -0.0005909949541091919, -0.0005679354071617126, -0.0005448758602142334, -0.0005218163132667542, -0.0004987567663192749, -0.00047569721937179565, -0.0004526376724243164, -0.00042957812547683716, -0.0004065185785293579, -0.00038345903158187866, -0.0003603994846343994, -0.00033733993768692017, -0.0003142803907394409, -0.00029122084379196167, -0.0002681612968444824, -0.0002451017498970032, -0.00022204220294952393, -0.00019898265600204468, -0.00017592310905456543, -0.00015286356210708618, -0.00012980401515960693, -0.00010674446821212769, -8.368492126464844e-05, -6.062537431716919e-05, -3.756582736968994e-05, -1.4506280422210693e-05, 8.553266525268555e-06, 3.16128134727478e-05, 5.467236042022705e-05, 7.77319073677063e-05, 0.00010079145431518555, 0.0001238510012626648, 0.00014691054821014404, 0.0001699700951576233, 0.00019302964210510254, 0.0002160891890525818, 0.00023914873600006104, 0.0002622082829475403, 0.00028526782989501953, 0.0003083273768424988, 0.00033138692378997803, 0.0003544464707374573, 0.0003775060176849365, 0.00040056556463241577, 0.000423625111579895, 0.00044668465852737427, 0.0004697442054748535, 0.0004928037524223328, 0.000515863299369812, 0.0005389228463172913, 0.0005619823932647705, 0.0005850419402122498, 0.000608101487159729, 0.0006311610341072083, 0.0006542205810546875]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 0.0, 5.0, 9.0, 6.0, 15.0, 15.0, 15.0, 21.0, 41.0, 31.0, 60.0, 86.0, 140.0, 161.0, 229.0, 417.0, 1007.0, 26295.0, 1011221.0, 6912.0, 742.0, 356.0, 224.0, 150.0, 106.0, 76.0, 62.0, 42.0, 31.0, 25.0, 17.0, 18.0, 4.0, 4.0, 6.0, 5.0, 1.0, 0.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01171112060546875, -0.011298298835754395, -0.010885477066040039, -0.010472655296325684, -0.010059833526611328, -0.009647011756896973, -0.009234189987182617, -0.008821368217468262, -0.008408546447753906, -0.00799572467803955, -0.007582902908325195, -0.00717008113861084, -0.006757259368896484, -0.006344437599182129, -0.0059316158294677734, -0.005518794059753418, -0.0051059722900390625, -0.004693150520324707, -0.0042803287506103516, -0.003867506980895996, -0.0034546852111816406, -0.003041863441467285, -0.0026290416717529297, -0.0022162199020385742, -0.0018033981323242188, -0.0013905763626098633, -0.0009777545928955078, -0.0005649328231811523, -0.00015211105346679688, 0.0002607107162475586, 0.0006735324859619141, 0.0010863542556762695, 0.001499176025390625, 0.0019119977951049805, 0.002324819564819336, 0.0027376413345336914, 0.003150463104248047, 0.0035632848739624023, 0.003976106643676758, 0.004388928413391113, 0.004801750183105469, 0.005214571952819824, 0.00562739372253418, 0.006040215492248535, 0.006453037261962891, 0.006865859031677246, 0.0072786808013916016, 0.007691502571105957, 0.008104324340820312, 0.008517146110534668, 0.008929967880249023, 0.009342789649963379, 0.009755611419677734, 0.01016843318939209, 0.010581254959106445, 0.0109940767288208, 0.011406898498535156, 0.011819720268249512, 0.012232542037963867, 0.012645363807678223, 0.013058185577392578, 0.013471007347106934, 0.013883829116821289, 0.014296650886535645, 0.01470947265625]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 925.0, 84.0, 0.0, 1.0], "bins": [-0.025905147194862366, -0.025479130446910858, -0.02505311369895935, -0.024627096951007843, -0.024201078340411186, -0.02377506159245968, -0.02334904484450817, -0.022923028096556664, -0.022497011348605156, -0.02207099460065365, -0.02164497785270214, -0.021218961104750633, -0.020792942494153976, -0.02036692574620247, -0.01994090899825096, -0.019514892250299454, -0.019088875502347946, -0.01866285875439644, -0.01823684200644493, -0.017810825258493423, -0.017384806647896767, -0.01695878989994526, -0.01653277315199375, -0.016106756404042244, -0.015680739656090736, -0.015254722908139229, -0.014828705228865147, -0.014402688480913639, -0.013976671732962132, -0.01355065405368805, -0.013124637305736542, -0.012698620557785034, -0.012272601947188377, -0.01184658519923687, -0.011420567519962788, -0.01099455077201128, -0.010568534024059772, -0.01014251634478569, -0.009716499596834183, -0.009290482848882675, -0.008864466100931168, -0.00843844935297966, -0.008012431673705578, -0.00758641492575407, -0.007160398177802563, -0.006734380964189768, -0.006308363750576973, -0.005882347002625465, -0.005456330254673958, -0.005030313041061163, -0.004604296293109655, -0.0041782790794968605, -0.003752262331545353, -0.003326245117932558, -0.002900228137150407, -0.0024742111563682556, -0.0020481941755861044, -0.0016221771948039532, -0.001196160214021802, -0.0007701431168243289, -0.0003441261360421777, 8.189096115529537e-05, 0.0005079079419374466, 0.0009339249227195978, 0.001359941903501749]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 12.0, 8.0, 11.0, 20.0, 14.0, 41.0, 46.0, 60.0, 61.0, 74.0, 79.0, 85.0, 81.0, 68.0, 61.0, 64.0, 59.0, 39.0, 32.0, 27.0, 27.0, 15.0, 13.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008486509323120117, -0.0008117500692605972, -0.0007748492062091827, -0.0007379483431577682, -0.0007010474801063538, -0.0006641466170549393, -0.0006272457540035248, -0.0005903448909521103, -0.0005534440279006958, -0.0005165431648492813, -0.0004796423017978668, -0.00044274143874645233, -0.00040584057569503784, -0.00036893971264362335, -0.00033203884959220886, -0.00029513798654079437, -0.0002582371234893799, -0.0002213362604379654, -0.0001844353973865509, -0.00014753453433513641, -0.00011063367128372192, -7.373280823230743e-05, -3.6831945180892944e-05, 6.891787052154541e-08, 3.6969780921936035e-05, 7.387064397335052e-05, 0.00011077150702476501, 0.0001476723700761795, 0.000184573233127594, 0.00022147409617900848, 0.000258374959230423, 0.00029527582228183746, 0.00033217668533325195, 0.00036907754838466644, 0.00040597841143608093, 0.0004428792744874954, 0.0004797801375389099, 0.0005166810005903244, 0.0005535818636417389, 0.0005904827266931534, 0.0006273835897445679, 0.0006642844527959824, 0.0007011853158473969, 0.0007380861788988113, 0.0007749870419502258, 0.0008118879050016403, 0.0008487887680530548, 0.0008856896311044693, 0.0009225904941558838, 0.0009594913572072983, 0.0009963922202587128, 0.0010332930833101273, 0.0010701939463615417, 0.0011070948094129562, 0.0011439956724643707, 0.0011808965355157852, 0.0012177973985671997, 0.0012546982616186142, 0.0012915991246700287, 0.0013284999877214432, 0.0013654008507728577, 0.0014023017138242722, 0.0014392025768756866, 0.0014761034399271011, 0.0015130043029785156]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 8.0, 5.0, 6.0, 10.0, 17.0, 11.0, 9.0, 16.0, 21.0, 20.0, 30.0, 29.0, 35.0, 39.0, 33.0, 41.0, 39.0, 55.0, 34.0, 38.0, 43.0, 49.0, 48.0, 46.0, 32.0, 36.0, 34.0, 25.0, 32.0, 28.0, 24.0, 19.0, 10.0, 16.0, 7.0, 11.0, 12.0, 6.0, 9.0, 3.0, 5.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0], "bins": [-9.5546875, -9.28680419921875, -9.0189208984375, -8.75103759765625, -8.483154296875, -8.21527099609375, -7.9473876953125, -7.67950439453125, -7.41162109375, -7.14373779296875, -6.8758544921875, -6.60797119140625, -6.340087890625, -6.07220458984375, -5.8043212890625, -5.53643798828125, -5.2685546875, -5.00067138671875, -4.7327880859375, -4.46490478515625, -4.197021484375, -3.92913818359375, -3.6612548828125, -3.39337158203125, -3.12548828125, -2.85760498046875, -2.5897216796875, -2.32183837890625, -2.053955078125, -1.78607177734375, -1.5181884765625, -1.25030517578125, -0.982421875, -0.71453857421875, -0.4466552734375, -0.17877197265625, 0.089111328125, 0.35699462890625, 0.6248779296875, 0.89276123046875, 1.16064453125, 1.42852783203125, 1.6964111328125, 1.96429443359375, 2.232177734375, 2.50006103515625, 2.7679443359375, 3.03582763671875, 3.3037109375, 3.57159423828125, 3.8394775390625, 4.10736083984375, 4.375244140625, 4.64312744140625, 4.9110107421875, 5.17889404296875, 5.44677734375, 5.71466064453125, 5.9825439453125, 6.25042724609375, 6.518310546875, 6.78619384765625, 7.0540771484375, 7.32196044921875, 7.58984375]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 11.0, 2.0, 2.0, 9.0, 11.0, 7.0, 12.0, 22.0, 30.0, 54.0, 58.0, 74.0, 108.0, 144.0, 199.0, 315.0, 424.0, 593.0, 866.0, 1339.0, 2117.0, 3457.0, 5796.0, 11233.0, 25894.0, 183710.0, 739638.0, 39274.0, 14551.0, 7086.0, 4091.0, 2462.0, 1636.0, 1008.0, 668.0, 522.0, 348.0, 214.0, 159.0, 94.0, 94.0, 72.0, 48.0, 31.0, 16.0, 18.0, 16.0, 2.0, 9.0, 10.0, 8.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-17.765625, -17.135009765625, -16.50439453125, -15.873779296875, -15.2431640625, -14.612548828125, -13.98193359375, -13.351318359375, -12.720703125, -12.090087890625, -11.45947265625, -10.828857421875, -10.1982421875, -9.567626953125, -8.93701171875, -8.306396484375, -7.67578125, -7.045166015625, -6.41455078125, -5.783935546875, -5.1533203125, -4.522705078125, -3.89208984375, -3.261474609375, -2.630859375, -2.000244140625, -1.36962890625, -0.739013671875, -0.1083984375, 0.522216796875, 1.15283203125, 1.783447265625, 2.4140625, 3.044677734375, 3.67529296875, 4.305908203125, 4.9365234375, 5.567138671875, 6.19775390625, 6.828369140625, 7.458984375, 8.089599609375, 8.72021484375, 9.350830078125, 9.9814453125, 10.612060546875, 11.24267578125, 11.873291015625, 12.50390625, 13.134521484375, 13.76513671875, 14.395751953125, 15.0263671875, 15.656982421875, 16.28759765625, 16.918212890625, 17.548828125, 18.179443359375, 18.81005859375, 19.440673828125, 20.0712890625, 20.701904296875, 21.33251953125, 21.963134765625, 22.59375]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 9.0, 4.0, 10.0, 12.0, 12.0, 18.0, 19.0, 12.0, 16.0, 24.0, 32.0, 24.0, 33.0, 41.0, 47.0, 52.0, 63.0, 102.0, 195.0, 1676.0, 104.0, 85.0, 56.0, 51.0, 51.0, 41.0, 35.0, 32.0, 24.0, 30.0, 26.0, 17.0, 16.0, 16.0, 15.0, 13.0, 5.0, 7.0, 4.0, 5.0, 1.0, 5.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.671875, -26.785400390625, -25.89892578125, -25.012451171875, -24.1259765625, -23.239501953125, -22.35302734375, -21.466552734375, -20.580078125, -19.693603515625, -18.80712890625, -17.920654296875, -17.0341796875, -16.147705078125, -15.26123046875, -14.374755859375, -13.48828125, -12.601806640625, -11.71533203125, -10.828857421875, -9.9423828125, -9.055908203125, -8.16943359375, -7.282958984375, -6.396484375, -5.510009765625, -4.62353515625, -3.737060546875, -2.8505859375, -1.964111328125, -1.07763671875, -0.191162109375, 0.6953125, 1.581787109375, 2.46826171875, 3.354736328125, 4.2412109375, 5.127685546875, 6.01416015625, 6.900634765625, 7.787109375, 8.673583984375, 9.56005859375, 10.446533203125, 11.3330078125, 12.219482421875, 13.10595703125, 13.992431640625, 14.87890625, 15.765380859375, 16.65185546875, 17.538330078125, 18.4248046875, 19.311279296875, 20.19775390625, 21.084228515625, 21.970703125, 22.857177734375, 23.74365234375, 24.630126953125, 25.5166015625, 26.403076171875, 27.28955078125, 28.176025390625, 29.0625]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 4.0, 3.0, 4.0, 3.0, 6.0, 8.0, 8.0, 13.0, 16.0, 17.0, 26.0, 38.0, 42.0, 51.0, 55.0, 95.0, 130.0, 190.0, 445.0, 1245.0, 5268.0, 31459.0, 2813722.0, 271290.0, 16682.0, 3204.0, 841.0, 291.0, 159.0, 95.0, 77.0, 64.0, 35.0, 20.0, 16.0, 15.0, 11.0, 15.0, 13.0, 8.0, 9.0, 7.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.0, -56.23388671875, -54.4677734375, -52.70166015625, -50.935546875, -49.16943359375, -47.4033203125, -45.63720703125, -43.87109375, -42.10498046875, -40.3388671875, -38.57275390625, -36.806640625, -35.04052734375, -33.2744140625, -31.50830078125, -29.7421875, -27.97607421875, -26.2099609375, -24.44384765625, -22.677734375, -20.91162109375, -19.1455078125, -17.37939453125, -15.61328125, -13.84716796875, -12.0810546875, -10.31494140625, -8.548828125, -6.78271484375, -5.0166015625, -3.25048828125, -1.484375, 0.28173828125, 2.0478515625, 3.81396484375, 5.580078125, 7.34619140625, 9.1123046875, 10.87841796875, 12.64453125, 14.41064453125, 16.1767578125, 17.94287109375, 19.708984375, 21.47509765625, 23.2412109375, 25.00732421875, 26.7734375, 28.53955078125, 30.3056640625, 32.07177734375, 33.837890625, 35.60400390625, 37.3701171875, 39.13623046875, 40.90234375, 42.66845703125, 44.4345703125, 46.20068359375, 47.966796875, 49.73291015625, 51.4990234375, 53.26513671875, 55.03125]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 10.0, 228.0, 721.0, 54.0, 3.0, 1.0, 1.0], "bins": [-819.880126953125, -806.0418090820312, -792.2034912109375, -778.3651733398438, -764.5269165039062, -750.6885986328125, -736.8502807617188, -723.011962890625, -709.1736450195312, -695.3353271484375, -681.4970092773438, -667.65869140625, -653.8204345703125, -639.9821166992188, -626.143798828125, -612.3054809570312, -598.4671630859375, -584.6288452148438, -570.79052734375, -556.9522094726562, -543.1139526367188, -529.275634765625, -515.4373168945312, -501.5989990234375, -487.7607116699219, -473.9223937988281, -460.0841064453125, -446.24578857421875, -432.407470703125, -418.56915283203125, -404.7308654785156, -390.8925476074219, -377.05419921875, -363.21588134765625, -349.3775939941406, -335.5392761230469, -321.7009582519531, -307.8626708984375, -294.02435302734375, -280.18603515625, -266.34771728515625, -252.50941467285156, -238.6710968017578, -224.83279418945312, -210.99447631835938, -197.1561737060547, -183.31787109375, -169.47955322265625, -155.64126586914062, -141.80296325683594, -127.96464538574219, -114.1263427734375, -100.28802490234375, -86.44972229003906, -72.61141204833984, -58.773101806640625, -44.934783935546875, -31.096473693847656, -17.25816535949707, -3.4198570251464844, 10.418453216552734, 24.256759643554688, 38.095069885253906, 51.933380126953125, 65.77169036865234]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 7.0, 3.0, 7.0, 10.0, 8.0, 18.0, 27.0, 18.0, 16.0, 21.0, 32.0, 36.0, 41.0, 29.0, 28.0, 37.0, 37.0, 37.0, 33.0, 47.0, 53.0, 40.0, 33.0, 42.0, 36.0, 33.0, 35.0, 32.0, 24.0, 21.0, 26.0, 15.0, 23.0, 15.0, 11.0, 12.0, 10.0, 7.0, 5.0, 6.0, 11.0, 7.0, 5.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-75.90670776367188, -73.55231475830078, -71.19792175292969, -68.84353637695312, -66.48914337158203, -64.13475036621094, -61.78036117553711, -59.42597198486328, -57.07157897949219, -54.717185974121094, -52.362796783447266, -50.00840759277344, -47.654014587402344, -45.29962158203125, -42.94523239135742, -40.590843200683594, -38.2364501953125, -35.882057189941406, -33.52766799926758, -31.173276901245117, -28.818885803222656, -26.464494705200195, -24.110103607177734, -21.755712509155273, -19.401321411132812, -17.04693031311035, -14.69253921508789, -12.33814811706543, -9.983757019042969, -7.629365921020508, -5.274974822998047, -2.920583724975586, -0.5661849975585938, 1.7882061004638672, 4.142597198486328, 6.496988296508789, 8.85137939453125, 11.205770492553711, 13.560161590576172, 15.914552688598633, 18.268943786621094, 20.623334884643555, 22.977725982666016, 25.332117080688477, 27.686508178710938, 30.0408992767334, 32.39529037475586, 34.74967956542969, 37.10407257080078, 39.458465576171875, 41.8128547668457, 44.16724395751953, 46.521636962890625, 48.87602996826172, 51.23041915893555, 53.584808349609375, 55.93920135498047, 58.29359436035156, 60.64798355102539, 63.00237274169922, 65.35676574707031, 67.7111587524414, 70.0655517578125, 72.41993713378906, 74.77433013916016]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 9.0, 3.0, 7.0, 11.0, 11.0, 7.0, 15.0, 12.0, 23.0, 19.0, 21.0, 33.0, 28.0, 32.0, 43.0, 35.0, 39.0, 28.0, 55.0, 32.0, 48.0, 33.0, 60.0, 29.0, 41.0, 33.0, 33.0, 34.0, 38.0, 29.0, 24.0, 16.0, 21.0, 16.0, 14.0, 9.0, 10.0, 9.0, 12.0, 4.0, 8.0, 6.0, 2.0, 2.0, 1.0, 5.0, 2.0, 1.0], "bins": [-9.75, -9.4827880859375, -9.215576171875, -8.9483642578125, -8.68115234375, -8.4139404296875, -8.146728515625, -7.8795166015625, -7.6123046875, -7.3450927734375, -7.077880859375, -6.8106689453125, -6.54345703125, -6.2762451171875, -6.009033203125, -5.7418212890625, -5.474609375, -5.2073974609375, -4.940185546875, -4.6729736328125, -4.40576171875, -4.1385498046875, -3.871337890625, -3.6041259765625, -3.3369140625, -3.0697021484375, -2.802490234375, -2.5352783203125, -2.26806640625, -2.0008544921875, -1.733642578125, -1.4664306640625, -1.19921875, -0.9320068359375, -0.664794921875, -0.3975830078125, -0.13037109375, 0.1368408203125, 0.404052734375, 0.6712646484375, 0.9384765625, 1.2056884765625, 1.472900390625, 1.7401123046875, 2.00732421875, 2.2745361328125, 2.541748046875, 2.8089599609375, 3.076171875, 3.3433837890625, 3.610595703125, 3.8778076171875, 4.14501953125, 4.4122314453125, 4.679443359375, 4.9466552734375, 5.2138671875, 5.4810791015625, 5.748291015625, 6.0155029296875, 6.28271484375, 6.5499267578125, 6.817138671875, 7.0843505859375, 7.3515625]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 10.0, 4.0, 11.0, 15.0, 15.0, 12.0, 22.0, 34.0, 57.0, 68.0, 96.0, 182.0, 251.0, 438.0, 821.0, 1523.0, 3208.0, 7767.0, 23776.0, 437568.0, 3552986.0, 137312.0, 16442.0, 6118.0, 2630.0, 1255.0, 663.0, 381.0, 211.0, 120.0, 91.0, 47.0, 38.0, 25.0, 12.0, 14.0, 18.0, 8.0, 9.0, 6.0, 4.0, 3.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0], "bins": [-41.65625, -40.510498046875, -39.36474609375, -38.218994140625, -37.0732421875, -35.927490234375, -34.78173828125, -33.635986328125, -32.490234375, -31.344482421875, -30.19873046875, -29.052978515625, -27.9072265625, -26.761474609375, -25.61572265625, -24.469970703125, -23.32421875, -22.178466796875, -21.03271484375, -19.886962890625, -18.7412109375, -17.595458984375, -16.44970703125, -15.303955078125, -14.158203125, -13.012451171875, -11.86669921875, -10.720947265625, -9.5751953125, -8.429443359375, -7.28369140625, -6.137939453125, -4.9921875, -3.846435546875, -2.70068359375, -1.554931640625, -0.4091796875, 0.736572265625, 1.88232421875, 3.028076171875, 4.173828125, 5.319580078125, 6.46533203125, 7.611083984375, 8.7568359375, 9.902587890625, 11.04833984375, 12.194091796875, 13.33984375, 14.485595703125, 15.63134765625, 16.777099609375, 17.9228515625, 19.068603515625, 20.21435546875, 21.360107421875, 22.505859375, 23.651611328125, 24.79736328125, 25.943115234375, 27.0888671875, 28.234619140625, 29.38037109375, 30.526123046875, 31.671875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 1.0, 3.0, 5.0, 4.0, 4.0, 7.0, 4.0, 15.0, 12.0, 15.0, 17.0, 17.0, 24.0, 38.0, 53.0, 71.0, 132.0, 229.0, 444.0, 746.0, 794.0, 574.0, 324.0, 178.0, 100.0, 70.0, 48.0, 29.0, 27.0, 19.0, 14.0, 18.0, 8.0, 2.0, 3.0, 8.0, 1.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-25.015625, -24.2841796875, -23.552734375, -22.8212890625, -22.08984375, -21.3583984375, -20.626953125, -19.8955078125, -19.1640625, -18.4326171875, -17.701171875, -16.9697265625, -16.23828125, -15.5068359375, -14.775390625, -14.0439453125, -13.3125, -12.5810546875, -11.849609375, -11.1181640625, -10.38671875, -9.6552734375, -8.923828125, -8.1923828125, -7.4609375, -6.7294921875, -5.998046875, -5.2666015625, -4.53515625, -3.8037109375, -3.072265625, -2.3408203125, -1.609375, -0.8779296875, -0.146484375, 0.5849609375, 1.31640625, 2.0478515625, 2.779296875, 3.5107421875, 4.2421875, 4.9736328125, 5.705078125, 6.4365234375, 7.16796875, 7.8994140625, 8.630859375, 9.3623046875, 10.09375, 10.8251953125, 11.556640625, 12.2880859375, 13.01953125, 13.7509765625, 14.482421875, 15.2138671875, 15.9453125, 16.6767578125, 17.408203125, 18.1396484375, 18.87109375, 19.6025390625, 20.333984375, 21.0654296875, 21.796875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 3.0, 0.0, 3.0, 4.0, 3.0, 1.0, 6.0, 3.0, 3.0, 9.0, 14.0, 23.0, 30.0, 48.0, 81.0, 208.0, 443.0, 1143.0, 3506.0, 12403.0, 68974.0, 3424518.0, 638717.0, 32670.0, 7762.0, 2304.0, 775.0, 284.0, 132.0, 75.0, 39.0, 17.0, 20.0, 15.0, 11.0, 6.0, 8.0, 6.0, 5.0, 3.0, 2.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-55.0, -53.1552734375, -51.310546875, -49.4658203125, -47.62109375, -45.7763671875, -43.931640625, -42.0869140625, -40.2421875, -38.3974609375, -36.552734375, -34.7080078125, -32.86328125, -31.0185546875, -29.173828125, -27.3291015625, -25.484375, -23.6396484375, -21.794921875, -19.9501953125, -18.10546875, -16.2607421875, -14.416015625, -12.5712890625, -10.7265625, -8.8818359375, -7.037109375, -5.1923828125, -3.34765625, -1.5029296875, 0.341796875, 2.1865234375, 4.03125, 5.8759765625, 7.720703125, 9.5654296875, 11.41015625, 13.2548828125, 15.099609375, 16.9443359375, 18.7890625, 20.6337890625, 22.478515625, 24.3232421875, 26.16796875, 28.0126953125, 29.857421875, 31.7021484375, 33.546875, 35.3916015625, 37.236328125, 39.0810546875, 40.92578125, 42.7705078125, 44.615234375, 46.4599609375, 48.3046875, 50.1494140625, 51.994140625, 53.8388671875, 55.68359375, 57.5283203125, 59.373046875, 61.2177734375, 63.0625]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 7.0, 15.0, 40.0, 86.0, 210.0, 314.0, 184.0, 99.0, 24.0, 27.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-196.27145385742188, -189.37081909179688, -182.47018432617188, -175.56954956054688, -168.66891479492188, -161.76828002929688, -154.86764526367188, -147.96701049804688, -141.06637573242188, -134.16574096679688, -127.26510620117188, -120.36447143554688, -113.46383666992188, -106.56320190429688, -99.66256713867188, -92.76193237304688, -85.8613052368164, -78.9606704711914, -72.0600357055664, -65.1594009399414, -58.258766174316406, -51.35813522338867, -44.45750045776367, -37.55686569213867, -30.656230926513672, -23.755596160888672, -16.854961395263672, -9.954328536987305, -3.0536937713623047, 3.8469390869140625, 10.747573852539062, 17.648208618164062, 24.548843383789062, 31.449478149414062, 38.35011291503906, 45.25074768066406, 52.15138244628906, 59.0520133972168, 65.95265197753906, 72.85328674316406, 79.75392150878906, 86.65455627441406, 93.55519104003906, 100.45582580566406, 107.35646057128906, 114.25709533691406, 121.15773010253906, 128.05836486816406, 134.958984375, 141.859619140625, 148.76025390625, 155.660888671875, 162.5615234375, 169.462158203125, 176.36279296875, 183.263427734375, 190.1640625, 197.064697265625, 203.96533203125, 210.865966796875, 217.7666015625, 224.667236328125, 231.56787109375, 238.468505859375, 245.369140625]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 7.0, 11.0, 6.0, 10.0, 9.0, 7.0, 10.0, 17.0, 26.0, 30.0, 27.0, 28.0, 32.0, 30.0, 27.0, 36.0, 43.0, 42.0, 41.0, 38.0, 53.0, 38.0, 33.0, 44.0, 44.0, 43.0, 29.0, 22.0, 38.0, 25.0, 19.0, 15.0, 20.0, 23.0, 10.0, 13.0, 11.0, 14.0, 13.0, 3.0, 9.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-74.88423156738281, -72.79228210449219, -70.70033264160156, -68.60838317871094, -66.51644134521484, -64.42449188232422, -62.332542419433594, -60.24059295654297, -58.148643493652344, -56.05669403076172, -53.96474838256836, -51.872798919677734, -49.78084945678711, -47.68890380859375, -45.596954345703125, -43.5050048828125, -41.41305923461914, -39.321109771728516, -37.229164123535156, -35.13721466064453, -33.045265197753906, -30.953317642211914, -28.861370086669922, -26.769420623779297, -24.677473068237305, -22.585525512695312, -20.493576049804688, -18.401628494262695, -16.309680938720703, -14.217731475830078, -12.125783920288086, -10.033835411071777, -7.941886901855469, -5.84993839263916, -3.7579903602600098, -1.6660423278808594, 0.4259061813354492, 2.517854690551758, 4.60980224609375, 6.701750755310059, 8.793699264526367, 10.885647773742676, 12.977596282958984, 15.069543838500977, 17.16149139404297, 19.253440856933594, 21.345388412475586, 23.437335968017578, 25.529285430908203, 27.621232986450195, 29.71318244934082, 31.805130004882812, 33.89707946777344, 35.98902893066406, 38.08097457885742, 40.17292404174805, 42.264869689941406, 44.35681915283203, 46.44876480102539, 48.540714263916016, 50.63266372680664, 52.724609375, 54.816558837890625, 56.90850830078125, 59.000457763671875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 5.0, 5.0, 13.0, 10.0, 10.0, 12.0, 13.0, 18.0, 15.0, 22.0, 23.0, 28.0, 30.0, 21.0, 37.0, 38.0, 50.0, 42.0, 52.0, 50.0, 41.0, 47.0, 46.0, 36.0, 41.0, 32.0, 39.0, 24.0, 42.0, 15.0, 18.0, 23.0, 21.0, 10.0, 11.0, 8.0, 10.0, 9.0, 5.0, 7.0, 5.0, 3.0, 2.0, 3.0, 4.0, 1.0, 2.0], "bins": [-10.09375, -9.81988525390625, -9.5460205078125, -9.27215576171875, -8.998291015625, -8.72442626953125, -8.4505615234375, -8.17669677734375, -7.90283203125, -7.62896728515625, -7.3551025390625, -7.08123779296875, -6.807373046875, -6.53350830078125, -6.2596435546875, -5.98577880859375, -5.7119140625, -5.43804931640625, -5.1641845703125, -4.89031982421875, -4.616455078125, -4.34259033203125, -4.0687255859375, -3.79486083984375, -3.52099609375, -3.24713134765625, -2.9732666015625, -2.69940185546875, -2.425537109375, -2.15167236328125, -1.8778076171875, -1.60394287109375, -1.330078125, -1.05621337890625, -0.7823486328125, -0.50848388671875, -0.234619140625, 0.03924560546875, 0.3131103515625, 0.58697509765625, 0.86083984375, 1.13470458984375, 1.4085693359375, 1.68243408203125, 1.956298828125, 2.23016357421875, 2.5040283203125, 2.77789306640625, 3.0517578125, 3.32562255859375, 3.5994873046875, 3.87335205078125, 4.147216796875, 4.42108154296875, 4.6949462890625, 4.96881103515625, 5.24267578125, 5.51654052734375, 5.7904052734375, 6.06427001953125, 6.338134765625, 6.61199951171875, 6.8858642578125, 7.15972900390625, 7.43359375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 4.0, 1.0, 1.0, 7.0, 20.0, 17.0, 34.0, 47.0, 69.0, 93.0, 124.0, 181.0, 264.0, 393.0, 505.0, 738.0, 1009.0, 1464.0, 2066.0, 3055.0, 4376.0, 6269.0, 8951.0, 13424.0, 19406.0, 28473.0, 42531.0, 64072.0, 97826.0, 151342.0, 200244.0, 134636.0, 88194.0, 58135.0, 38539.0, 25528.0, 17286.0, 12057.0, 8230.0, 5719.0, 3911.0, 2701.0, 1952.0, 1444.0, 928.0, 693.0, 463.0, 328.0, 237.0, 154.0, 119.0, 88.0, 67.0, 40.0, 46.0, 28.0, 8.0, 13.0, 7.0, 2.0, 8.0, 3.0], "bins": [-0.1748046875, -0.1694049835205078, -0.16400527954101562, -0.15860557556152344, -0.15320587158203125, -0.14780616760253906, -0.14240646362304688, -0.1370067596435547, -0.1316070556640625, -0.1262073516845703, -0.12080764770507812, -0.11540794372558594, -0.11000823974609375, -0.10460853576660156, -0.09920883178710938, -0.09380912780761719, -0.088409423828125, -0.08300971984863281, -0.07761001586914062, -0.07221031188964844, -0.06681060791015625, -0.06141090393066406, -0.056011199951171875, -0.05061149597167969, -0.0452117919921875, -0.03981208801269531, -0.034412384033203125, -0.029012680053710938, -0.02361297607421875, -0.018213272094726562, -0.012813568115234375, -0.0074138641357421875, -0.00201416015625, 0.0033855438232421875, 0.008785247802734375, 0.014184951782226562, 0.01958465576171875, 0.024984359741210938, 0.030384063720703125, 0.03578376770019531, 0.0411834716796875, 0.04658317565917969, 0.051982879638671875, 0.05738258361816406, 0.06278228759765625, 0.06818199157714844, 0.07358169555664062, 0.07898139953613281, 0.084381103515625, 0.08978080749511719, 0.09518051147460938, 0.10058021545410156, 0.10597991943359375, 0.11137962341308594, 0.11677932739257812, 0.12217903137207031, 0.1275787353515625, 0.1329784393310547, 0.13837814331054688, 0.14377784729003906, 0.14917755126953125, 0.15457725524902344, 0.15997695922851562, 0.1653766632080078, 0.1707763671875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 3.0, 5.0, 3.0, 7.0, 4.0, 10.0, 15.0, 13.0, 17.0, 18.0, 25.0, 32.0, 25.0, 28.0, 31.0, 41.0, 42.0, 35.0, 51.0, 48.0, 1069.0, 42.0, 55.0, 38.0, 43.0, 39.0, 49.0, 35.0, 31.0, 31.0, 30.0, 13.0, 19.0, 22.0, 15.0, 12.0, 7.0, 11.0, 4.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.078125, -5.85986328125, -5.6416015625, -5.42333984375, -5.205078125, -4.98681640625, -4.7685546875, -4.55029296875, -4.33203125, -4.11376953125, -3.8955078125, -3.67724609375, -3.458984375, -3.24072265625, -3.0224609375, -2.80419921875, -2.5859375, -2.36767578125, -2.1494140625, -1.93115234375, -1.712890625, -1.49462890625, -1.2763671875, -1.05810546875, -0.83984375, -0.62158203125, -0.4033203125, -0.18505859375, 0.033203125, 0.25146484375, 0.4697265625, 0.68798828125, 0.90625, 1.12451171875, 1.3427734375, 1.56103515625, 1.779296875, 1.99755859375, 2.2158203125, 2.43408203125, 2.65234375, 2.87060546875, 3.0888671875, 3.30712890625, 3.525390625, 3.74365234375, 3.9619140625, 4.18017578125, 4.3984375, 4.61669921875, 4.8349609375, 5.05322265625, 5.271484375, 5.48974609375, 5.7080078125, 5.92626953125, 6.14453125, 6.36279296875, 6.5810546875, 6.79931640625, 7.017578125, 7.23583984375, 7.4541015625, 7.67236328125, 7.890625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 17.0, 7.0, 20.0, 31.0, 38.0, 83.0, 112.0, 166.0, 242.0, 401.0, 580.0, 948.0, 1546.0, 2628.0, 4222.0, 6810.0, 11519.0, 18829.0, 31381.0, 52477.0, 87954.0, 150086.0, 1282605.0, 181280.0, 105781.0, 62148.0, 37637.0, 22703.0, 13740.0, 8270.0, 4869.0, 3094.0, 1859.0, 1127.0, 695.0, 425.0, 293.0, 170.0, 121.0, 74.0, 51.0, 35.0, 19.0, 16.0, 10.0, 10.0, 4.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1103515625, -0.10686779022216797, -0.10338401794433594, -0.0999002456665039, -0.09641647338867188, -0.09293270111083984, -0.08944892883300781, -0.08596515655517578, -0.08248138427734375, -0.07899761199951172, -0.07551383972167969, -0.07203006744384766, -0.06854629516601562, -0.0650625228881836, -0.06157875061035156, -0.05809497833251953, -0.0546112060546875, -0.05112743377685547, -0.04764366149902344, -0.044159889221191406, -0.040676116943359375, -0.037192344665527344, -0.03370857238769531, -0.03022480010986328, -0.02674102783203125, -0.02325725555419922, -0.019773483276367188, -0.016289710998535156, -0.012805938720703125, -0.009322166442871094, -0.0058383941650390625, -0.0023546218872070312, 0.001129150390625, 0.004612922668457031, 0.008096694946289062, 0.011580467224121094, 0.015064239501953125, 0.018548011779785156, 0.022031784057617188, 0.02551555633544922, 0.02899932861328125, 0.03248310089111328, 0.03596687316894531, 0.039450645446777344, 0.042934417724609375, 0.046418190002441406, 0.04990196228027344, 0.05338573455810547, 0.0568695068359375, 0.06035327911376953, 0.06383705139160156, 0.0673208236694336, 0.07080459594726562, 0.07428836822509766, 0.07777214050292969, 0.08125591278076172, 0.08473968505859375, 0.08822345733642578, 0.09170722961425781, 0.09519100189208984, 0.09867477416992188, 0.1021585464477539, 0.10564231872558594, 0.10912609100341797, 0.11260986328125]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 4.0, 4.0, 6.0, 10.0, 5.0, 6.0, 20.0, 16.0, 32.0, 24.0, 32.0, 34.0, 32.0, 45.0, 49.0, 51.0, 46.0, 50.0, 59.0, 53.0, 47.0, 56.0, 40.0, 30.0, 42.0, 29.0, 31.0, 16.0, 26.0, 16.0, 17.0, 17.0, 9.0, 12.0, 4.0, 7.0, 5.0, 4.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0008707046508789062, -0.000844612717628479, -0.0008185207843780518, -0.0007924288511276245, -0.0007663369178771973, -0.00074024498462677, -0.0007141530513763428, -0.0006880611181259155, -0.0006619691848754883, -0.000635877251625061, -0.0006097853183746338, -0.0005836933851242065, -0.0005576014518737793, -0.000531509518623352, -0.0005054175853729248, -0.00047932565212249756, -0.0004532337188720703, -0.00042714178562164307, -0.0004010498523712158, -0.0003749579191207886, -0.00034886598587036133, -0.0003227740526199341, -0.00029668211936950684, -0.0002705901861190796, -0.00024449825286865234, -0.0002184063196182251, -0.00019231438636779785, -0.0001662224531173706, -0.00014013051986694336, -0.00011403858661651611, -8.794665336608887e-05, -6.185472011566162e-05, -3.5762786865234375e-05, -9.670853614807129e-06, 1.6421079635620117e-05, 4.251301288604736e-05, 6.860494613647461e-05, 9.469687938690186e-05, 0.0001207888126373291, 0.00014688074588775635, 0.0001729726791381836, 0.00019906461238861084, 0.00022515654563903809, 0.00025124847888946533, 0.0002773404121398926, 0.0003034323453903198, 0.00032952427864074707, 0.0003556162118911743, 0.00038170814514160156, 0.0004078000783920288, 0.00043389201164245605, 0.0004599839448928833, 0.00048607587814331055, 0.0005121678113937378, 0.000538259744644165, 0.0005643516778945923, 0.0005904436111450195, 0.0006165355443954468, 0.000642627477645874, 0.0006687194108963013, 0.0006948113441467285, 0.0007209032773971558, 0.000746995210647583, 0.0007730871438980103, 0.0007991790771484375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 5.0, 7.0, 5.0, 11.0, 13.0, 19.0, 24.0, 16.0, 39.0, 31.0, 45.0, 72.0, 88.0, 135.0, 273.0, 415.0, 882.0, 7228.0, 985463.0, 50863.0, 1447.0, 498.0, 285.0, 204.0, 133.0, 95.0, 56.0, 51.0, 44.0, 26.0, 17.0, 10.0, 10.0, 9.0, 6.0, 5.0, 4.0, 6.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.01458740234375, -0.014112234115600586, -0.013637065887451172, -0.013161897659301758, -0.012686729431152344, -0.01221156120300293, -0.011736392974853516, -0.011261224746704102, -0.010786056518554688, -0.010310888290405273, -0.00983572006225586, -0.009360551834106445, -0.008885383605957031, -0.008410215377807617, -0.007935047149658203, -0.007459878921508789, -0.006984710693359375, -0.006509542465209961, -0.006034374237060547, -0.005559206008911133, -0.005084037780761719, -0.004608869552612305, -0.004133701324462891, -0.0036585330963134766, -0.0031833648681640625, -0.0027081966400146484, -0.0022330284118652344, -0.0017578601837158203, -0.0012826919555664062, -0.0008075237274169922, -0.0003323554992675781, 0.00014281272888183594, 0.00061798095703125, 0.001093149185180664, 0.0015683174133300781, 0.002043485641479492, 0.0025186538696289062, 0.0029938220977783203, 0.0034689903259277344, 0.0039441585540771484, 0.0044193267822265625, 0.0048944950103759766, 0.005369663238525391, 0.005844831466674805, 0.006319999694824219, 0.006795167922973633, 0.007270336151123047, 0.007745504379272461, 0.008220672607421875, 0.008695840835571289, 0.009171009063720703, 0.009646177291870117, 0.010121345520019531, 0.010596513748168945, 0.01107168197631836, 0.011546850204467773, 0.012022018432617188, 0.012497186660766602, 0.012972354888916016, 0.01344752311706543, 0.013922691345214844, 0.014397859573364258, 0.014873027801513672, 0.015348196029663086, 0.0158233642578125]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 6.0, 105.0, 876.0, 28.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.017937416210770607, -0.017613166943192482, -0.017288919538259506, -0.01696467027068138, -0.016640421003103256, -0.01631617359817028, -0.015991924330592155, -0.01566767506301403, -0.01534342672675848, -0.01501917839050293, -0.014694929122924805, -0.014370680786669254, -0.014046432450413704, -0.013722183182835579, -0.013397934846580029, -0.013073686510324478, -0.012749437242746353, -0.012425188906490803, -0.012100939638912678, -0.011776691302657127, -0.011452442035079002, -0.011128193698823452, -0.010803945362567902, -0.010479696094989777, -0.010155447758734226, -0.009831199422478676, -0.00950695015490055, -0.009182701818645, -0.00885845348238945, -0.008534204214811325, -0.008209955878555775, -0.007885707542300224, -0.007561459206044674, -0.007237210404127836, -0.0069129616022109985, -0.006588713265955448, -0.0062644644640386105, -0.005940215662121773, -0.005615967325866222, -0.005291718523949385, -0.004967469722032547, -0.004643220920115709, -0.004318972118198872, -0.003994723781943321, -0.0036704749800264835, -0.003346226178109646, -0.003021977609023452, -0.0026977290399372578, -0.0023734800051897764, -0.0020492314361035824, -0.0017249826341867447, -0.0014007339486852288, -0.001076485263183713, -0.0007522365776821971, -0.00042798789218068123, -0.00010373932309448719, 0.0002205094788223505, 0.0005447581643238664, 0.0008690068498253822, 0.001193255535326898, 0.001517504220828414, 0.0018417529063299298, 0.0021660015918314457, 0.0024902501609176397, 0.0028144989628344774]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 5.0, 8.0, 14.0, 16.0, 16.0, 29.0, 17.0, 28.0, 31.0, 42.0, 40.0, 52.0, 39.0, 45.0, 40.0, 58.0, 48.0, 45.0, 48.0, 54.0, 63.0, 46.0, 46.0, 34.0, 22.0, 21.0, 20.0, 12.0, 13.0, 11.0, 14.0, 9.0, 6.0, 4.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00109100341796875, -0.0010572606697678566, -0.0010235179215669632, -0.0009897751733660698, -0.0009560324251651764, -0.000922289676964283, -0.0008885469287633896, -0.0008548041805624962, -0.0008210614323616028, -0.0007873186841607094, -0.000753575935959816, -0.0007198331877589226, -0.0006860904395580292, -0.0006523476913571358, -0.0006186049431562424, -0.000584862194955349, -0.0005511194467544556, -0.0005173766985535622, -0.00048363395035266876, -0.00044989120215177536, -0.00041614845395088196, -0.00038240570574998856, -0.00034866295754909515, -0.00031492020934820175, -0.00028117746114730835, -0.00024743471294641495, -0.00021369196474552155, -0.00017994921654462814, -0.00014620646834373474, -0.00011246372014284134, -7.872097194194794e-05, -4.4978223741054535e-05, -1.1235475540161133e-05, 2.250727266073227e-05, 5.625002086162567e-05, 8.999276906251907e-05, 0.00012373551726341248, 0.00015747826546430588, 0.00019122101366519928, 0.00022496376186609268, 0.0002587065100669861, 0.0002924492582678795, 0.0003261920064687729, 0.0003599347546696663, 0.0003936775028705597, 0.0004274202510714531, 0.0004611629992723465, 0.0004949057474732399, 0.0005286484956741333, 0.0005623912438750267, 0.0005961339920759201, 0.0006298767402768135, 0.0006636194884777069, 0.0006973622366786003, 0.0007311049848794937, 0.0007648477330803871, 0.0007985904812812805, 0.0008323332294821739, 0.0008660759776830673, 0.0008998187258839607, 0.0009335614740848541, 0.0009673042222857475, 0.001001046970486641, 0.0010347897186875343, 0.0010685324668884277]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 5.0, 5.0, 13.0, 10.0, 10.0, 12.0, 13.0, 18.0, 15.0, 22.0, 23.0, 28.0, 30.0, 21.0, 37.0, 38.0, 50.0, 42.0, 52.0, 50.0, 41.0, 47.0, 46.0, 36.0, 41.0, 32.0, 39.0, 24.0, 42.0, 15.0, 18.0, 23.0, 21.0, 10.0, 11.0, 8.0, 10.0, 9.0, 5.0, 7.0, 5.0, 3.0, 2.0, 3.0, 4.0, 1.0, 2.0], "bins": [-10.09375, -9.81988525390625, -9.5460205078125, -9.27215576171875, -8.998291015625, -8.72442626953125, -8.4505615234375, -8.17669677734375, -7.90283203125, -7.62896728515625, -7.3551025390625, -7.08123779296875, -6.807373046875, -6.53350830078125, -6.2596435546875, -5.98577880859375, -5.7119140625, -5.43804931640625, -5.1641845703125, -4.89031982421875, -4.616455078125, -4.34259033203125, -4.0687255859375, -3.79486083984375, -3.52099609375, -3.24713134765625, -2.9732666015625, -2.69940185546875, -2.425537109375, -2.15167236328125, -1.8778076171875, -1.60394287109375, -1.330078125, -1.05621337890625, -0.7823486328125, -0.50848388671875, -0.234619140625, 0.03924560546875, 0.3131103515625, 0.58697509765625, 0.86083984375, 1.13470458984375, 1.4085693359375, 1.68243408203125, 1.956298828125, 2.23016357421875, 2.5040283203125, 2.77789306640625, 3.0517578125, 3.32562255859375, 3.5994873046875, 3.87335205078125, 4.147216796875, 4.42108154296875, 4.6949462890625, 4.96881103515625, 5.24267578125, 5.51654052734375, 5.7904052734375, 6.06427001953125, 6.338134765625, 6.61199951171875, 6.8858642578125, 7.15972900390625, 7.43359375]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 8.0, 2.0, 3.0, 6.0, 17.0, 12.0, 29.0, 30.0, 39.0, 49.0, 79.0, 101.0, 141.0, 187.0, 277.0, 410.0, 602.0, 999.0, 1652.0, 2833.0, 5441.0, 12591.0, 40454.0, 603973.0, 321894.0, 33530.0, 11141.0, 5022.0, 2613.0, 1537.0, 946.0, 615.0, 412.0, 297.0, 171.0, 132.0, 81.0, 72.0, 41.0, 28.0, 24.0, 13.0, 13.0, 15.0, 8.0, 3.0, 9.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.203125, -23.36669921875, -22.5302734375, -21.69384765625, -20.857421875, -20.02099609375, -19.1845703125, -18.34814453125, -17.51171875, -16.67529296875, -15.8388671875, -15.00244140625, -14.166015625, -13.32958984375, -12.4931640625, -11.65673828125, -10.8203125, -9.98388671875, -9.1474609375, -8.31103515625, -7.474609375, -6.63818359375, -5.8017578125, -4.96533203125, -4.12890625, -3.29248046875, -2.4560546875, -1.61962890625, -0.783203125, 0.05322265625, 0.8896484375, 1.72607421875, 2.5625, 3.39892578125, 4.2353515625, 5.07177734375, 5.908203125, 6.74462890625, 7.5810546875, 8.41748046875, 9.25390625, 10.09033203125, 10.9267578125, 11.76318359375, 12.599609375, 13.43603515625, 14.2724609375, 15.10888671875, 15.9453125, 16.78173828125, 17.6181640625, 18.45458984375, 19.291015625, 20.12744140625, 20.9638671875, 21.80029296875, 22.63671875, 23.47314453125, 24.3095703125, 25.14599609375, 25.982421875, 26.81884765625, 27.6552734375, 28.49169921875, 29.328125]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 5.0, 8.0, 3.0, 5.0, 7.0, 8.0, 5.0, 11.0, 10.0, 19.0, 27.0, 19.0, 36.0, 29.0, 36.0, 34.0, 45.0, 45.0, 51.0, 98.0, 171.0, 1685.0, 175.0, 88.0, 64.0, 34.0, 47.0, 36.0, 38.0, 40.0, 31.0, 29.0, 16.0, 19.0, 24.0, 9.0, 16.0, 8.0, 6.0, 4.0, 5.0, 2.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.09375, -33.07666015625, -32.0595703125, -31.04248046875, -30.025390625, -29.00830078125, -27.9912109375, -26.97412109375, -25.95703125, -24.93994140625, -23.9228515625, -22.90576171875, -21.888671875, -20.87158203125, -19.8544921875, -18.83740234375, -17.8203125, -16.80322265625, -15.7861328125, -14.76904296875, -13.751953125, -12.73486328125, -11.7177734375, -10.70068359375, -9.68359375, -8.66650390625, -7.6494140625, -6.63232421875, -5.615234375, -4.59814453125, -3.5810546875, -2.56396484375, -1.546875, -0.52978515625, 0.4873046875, 1.50439453125, 2.521484375, 3.53857421875, 4.5556640625, 5.57275390625, 6.58984375, 7.60693359375, 8.6240234375, 9.64111328125, 10.658203125, 11.67529296875, 12.6923828125, 13.70947265625, 14.7265625, 15.74365234375, 16.7607421875, 17.77783203125, 18.794921875, 19.81201171875, 20.8291015625, 21.84619140625, 22.86328125, 23.88037109375, 24.8974609375, 25.91455078125, 26.931640625, 27.94873046875, 28.9658203125, 29.98291015625, 31.0]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 6.0, 5.0, 3.0, 6.0, 6.0, 3.0, 12.0, 6.0, 17.0, 14.0, 31.0, 37.0, 30.0, 39.0, 104.0, 133.0, 281.0, 532.0, 1206.0, 3287.0, 11054.0, 77604.0, 2945764.0, 87569.0, 11888.0, 3543.0, 1342.0, 528.0, 235.0, 117.0, 81.0, 54.0, 37.0, 33.0, 25.0, 11.0, 17.0, 11.0, 10.0, 8.0, 7.0, 7.0, 3.0, 4.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-50.4375, -48.6689453125, -46.900390625, -45.1318359375, -43.36328125, -41.5947265625, -39.826171875, -38.0576171875, -36.2890625, -34.5205078125, -32.751953125, -30.9833984375, -29.21484375, -27.4462890625, -25.677734375, -23.9091796875, -22.140625, -20.3720703125, -18.603515625, -16.8349609375, -15.06640625, -13.2978515625, -11.529296875, -9.7607421875, -7.9921875, -6.2236328125, -4.455078125, -2.6865234375, -0.91796875, 0.8505859375, 2.619140625, 4.3876953125, 6.15625, 7.9248046875, 9.693359375, 11.4619140625, 13.23046875, 14.9990234375, 16.767578125, 18.5361328125, 20.3046875, 22.0732421875, 23.841796875, 25.6103515625, 27.37890625, 29.1474609375, 30.916015625, 32.6845703125, 34.453125, 36.2216796875, 37.990234375, 39.7587890625, 41.52734375, 43.2958984375, 45.064453125, 46.8330078125, 48.6015625, 50.3701171875, 52.138671875, 53.9072265625, 55.67578125, 57.4443359375, 59.212890625, 60.9814453125, 62.75]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 41.0, 905.0, 74.0, 0.0, 1.0], "bins": [-1604.9996337890625, -1578.48681640625, -1551.973876953125, -1525.4610595703125, -1498.9482421875, -1472.435302734375, -1445.9224853515625, -1419.40966796875, -1392.896728515625, -1366.3839111328125, -1339.8709716796875, -1313.358154296875, -1286.8453369140625, -1260.3323974609375, -1233.819580078125, -1207.3067626953125, -1180.7939453125, -1154.2811279296875, -1127.7681884765625, -1101.25537109375, -1074.7425537109375, -1048.2296142578125, -1021.716796875, -995.2039794921875, -968.6910400390625, -942.1781616210938, -915.6653442382812, -889.1524658203125, -862.6395874023438, -836.1267700195312, -809.6138916015625, -783.10107421875, -756.5881958007812, -730.0753173828125, -703.5625, -677.0496215820312, -650.5367431640625, -624.02392578125, -597.5110473632812, -570.9981689453125, -544.4853515625, -517.9724731445312, -491.4596252441406, -464.94677734375, -438.4339294433594, -411.92108154296875, -385.408203125, -358.8953552246094, -332.3824768066406, -305.86962890625, -279.35675048828125, -252.84390258789062, -226.3310546875, -199.8181915283203, -173.30532836914062, -146.79248046875, -120.27960968017578, -93.76675415039062, -67.25389099121094, -40.74103546142578, -14.228179931640625, 12.284675598144531, 38.79753875732422, 65.31038665771484, 91.82324981689453]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 4.0, 6.0, 5.0, 4.0, 12.0, 13.0, 13.0, 26.0, 14.0, 19.0, 21.0, 27.0, 23.0, 37.0, 28.0, 40.0, 42.0, 29.0, 41.0, 22.0, 38.0, 32.0, 43.0, 49.0, 45.0, 31.0, 37.0, 34.0, 26.0, 23.0, 31.0, 29.0, 23.0, 20.0, 16.0, 14.0, 16.0, 15.0, 8.0, 8.0, 6.0, 5.0, 9.0, 8.0, 1.0, 4.0, 5.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.74593353271484, -77.18772888183594, -74.62952423095703, -72.07131958007812, -69.51311492919922, -66.95491027832031, -64.3967056274414, -61.8385009765625, -59.280296325683594, -56.72209167480469, -54.16388702392578, -51.605682373046875, -49.04747772216797, -46.48927307128906, -43.931068420410156, -41.37286376953125, -38.814659118652344, -36.25645446777344, -33.69824981689453, -31.140045166015625, -28.58184051513672, -26.023635864257812, -23.465431213378906, -20.9072265625, -18.349021911621094, -15.790817260742188, -13.232612609863281, -10.674407958984375, -8.116203308105469, -5.5579986572265625, -2.9997940063476562, -0.44158935546875, 2.116607666015625, 4.674812316894531, 7.2330169677734375, 9.791221618652344, 12.34942626953125, 14.907630920410156, 17.465835571289062, 20.02404022216797, 22.582244873046875, 25.14044952392578, 27.698654174804688, 30.256858825683594, 32.8150634765625, 35.373268127441406, 37.93147277832031, 40.48967742919922, 43.047882080078125, 45.60608673095703, 48.16429138183594, 50.722496032714844, 53.28070068359375, 55.838905334472656, 58.39710998535156, 60.95531463623047, 63.513519287109375, 66.07172393798828, 68.62992858886719, 71.1881332397461, 73.746337890625, 76.3045425415039, 78.86274719238281, 81.42095184326172, 83.97915649414062]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 6.0, 4.0, 6.0, 10.0, 9.0, 9.0, 8.0, 13.0, 13.0, 17.0, 21.0, 17.0, 19.0, 39.0, 29.0, 35.0, 23.0, 49.0, 43.0, 52.0, 40.0, 33.0, 50.0, 46.0, 40.0, 48.0, 43.0, 36.0, 33.0, 27.0, 30.0, 21.0, 16.0, 24.0, 18.0, 10.0, 11.0, 11.0, 11.0, 3.0, 11.0, 6.0, 3.0, 4.0, 4.0, 3.0, 0.0, 2.0], "bins": [-11.0859375, -10.7911376953125, -10.496337890625, -10.2015380859375, -9.90673828125, -9.6119384765625, -9.317138671875, -9.0223388671875, -8.7275390625, -8.4327392578125, -8.137939453125, -7.8431396484375, -7.54833984375, -7.2535400390625, -6.958740234375, -6.6639404296875, -6.369140625, -6.0743408203125, -5.779541015625, -5.4847412109375, -5.18994140625, -4.8951416015625, -4.600341796875, -4.3055419921875, -4.0107421875, -3.7159423828125, -3.421142578125, -3.1263427734375, -2.83154296875, -2.5367431640625, -2.241943359375, -1.9471435546875, -1.65234375, -1.3575439453125, -1.062744140625, -0.7679443359375, -0.47314453125, -0.1783447265625, 0.116455078125, 0.4112548828125, 0.7060546875, 1.0008544921875, 1.295654296875, 1.5904541015625, 1.88525390625, 2.1800537109375, 2.474853515625, 2.7696533203125, 3.064453125, 3.3592529296875, 3.654052734375, 3.9488525390625, 4.24365234375, 4.5384521484375, 4.833251953125, 5.1280517578125, 5.4228515625, 5.7176513671875, 6.012451171875, 6.3072509765625, 6.60205078125, 6.8968505859375, 7.191650390625, 7.4864501953125, 7.78125]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 9.0, 13.0, 10.0, 14.0, 12.0, 25.0, 33.0, 32.0, 57.0, 64.0, 73.0, 134.0, 181.0, 224.0, 320.0, 443.0, 570.0, 811.0, 1209.0, 1734.0, 2636.0, 4021.0, 6601.0, 11650.0, 23663.0, 105516.0, 713560.0, 2444780.0, 706215.0, 110818.0, 27797.0, 11982.0, 6706.0, 4052.0, 2649.0, 1754.0, 1129.0, 821.0, 567.0, 398.0, 285.0, 234.0, 138.0, 94.0, 78.0, 60.0, 35.0, 28.0, 27.0, 9.0, 8.0, 6.0, 3.0, 1.0, 1.0], "bins": [-19.03125, -18.5098876953125, -17.988525390625, -17.4671630859375, -16.94580078125, -16.4244384765625, -15.903076171875, -15.3817138671875, -14.8603515625, -14.3389892578125, -13.817626953125, -13.2962646484375, -12.77490234375, -12.2535400390625, -11.732177734375, -11.2108154296875, -10.689453125, -10.1680908203125, -9.646728515625, -9.1253662109375, -8.60400390625, -8.0826416015625, -7.561279296875, -7.0399169921875, -6.5185546875, -5.9971923828125, -5.475830078125, -4.9544677734375, -4.43310546875, -3.9117431640625, -3.390380859375, -2.8690185546875, -2.34765625, -1.8262939453125, -1.304931640625, -0.7835693359375, -0.26220703125, 0.2591552734375, 0.780517578125, 1.3018798828125, 1.8232421875, 2.3446044921875, 2.865966796875, 3.3873291015625, 3.90869140625, 4.4300537109375, 4.951416015625, 5.4727783203125, 5.994140625, 6.5155029296875, 7.036865234375, 7.5582275390625, 8.07958984375, 8.6009521484375, 9.122314453125, 9.6436767578125, 10.1650390625, 10.6864013671875, 11.207763671875, 11.7291259765625, 12.25048828125, 12.7718505859375, 13.293212890625, 13.8145751953125, 14.3359375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 5.0, 10.0, 6.0, 8.0, 9.0, 10.0, 17.0, 20.0, 34.0, 45.0, 45.0, 83.0, 159.0, 280.0, 540.0, 933.0, 876.0, 426.0, 205.0, 122.0, 71.0, 46.0, 33.0, 12.0, 14.0, 23.0, 13.0, 6.0, 5.0, 6.0, 7.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-30.1875, -29.267578125, -28.34765625, -27.427734375, -26.5078125, -25.587890625, -24.66796875, -23.748046875, -22.828125, -21.908203125, -20.98828125, -20.068359375, -19.1484375, -18.228515625, -17.30859375, -16.388671875, -15.46875, -14.548828125, -13.62890625, -12.708984375, -11.7890625, -10.869140625, -9.94921875, -9.029296875, -8.109375, -7.189453125, -6.26953125, -5.349609375, -4.4296875, -3.509765625, -2.58984375, -1.669921875, -0.75, 0.169921875, 1.08984375, 2.009765625, 2.9296875, 3.849609375, 4.76953125, 5.689453125, 6.609375, 7.529296875, 8.44921875, 9.369140625, 10.2890625, 11.208984375, 12.12890625, 13.048828125, 13.96875, 14.888671875, 15.80859375, 16.728515625, 17.6484375, 18.568359375, 19.48828125, 20.408203125, 21.328125, 22.248046875, 23.16796875, 24.087890625, 25.0078125, 25.927734375, 26.84765625, 27.767578125, 28.6875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 9.0, 10.0, 12.0, 19.0, 51.0, 47.0, 87.0, 137.0, 303.0, 674.0, 1636.0, 4902.0, 18757.0, 129255.0, 3709487.0, 290481.0, 27887.0, 6676.0, 2196.0, 792.0, 374.0, 195.0, 106.0, 70.0, 34.0, 25.0, 19.0, 10.0, 9.0, 11.0, 0.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.34375, -53.59375, -51.84375, -50.09375, -48.34375, -46.59375, -44.84375, -43.09375, -41.34375, -39.59375, -37.84375, -36.09375, -34.34375, -32.59375, -30.84375, -29.09375, -27.34375, -25.59375, -23.84375, -22.09375, -20.34375, -18.59375, -16.84375, -15.09375, -13.34375, -11.59375, -9.84375, -8.09375, -6.34375, -4.59375, -2.84375, -1.09375, 0.65625, 2.40625, 4.15625, 5.90625, 7.65625, 9.40625, 11.15625, 12.90625, 14.65625, 16.40625, 18.15625, 19.90625, 21.65625, 23.40625, 25.15625, 26.90625, 28.65625, 30.40625, 32.15625, 33.90625, 35.65625, 37.40625, 39.15625, 40.90625, 42.65625, 44.40625, 46.15625, 47.90625, 49.65625, 51.40625, 53.15625, 54.90625, 56.65625]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 15.0, 27.0, 76.0, 109.0, 251.0, 253.0, 145.0, 53.0, 36.0, 20.0, 9.0, 8.0, 7.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-151.91897583007812, -145.04087829589844, -138.16278076171875, -131.28468322753906, -124.40658569335938, -117.52848815917969, -110.650390625, -103.77229309082031, -96.89419555664062, -90.01609802246094, -83.13800048828125, -76.25990295410156, -69.38180541992188, -62.50370407104492, -55.625606536865234, -48.74750900268555, -41.869407653808594, -34.991310119628906, -28.11321258544922, -21.2351131439209, -14.357015609741211, -7.478916168212891, -0.6008186340332031, 6.277278900146484, 13.155376434326172, 20.03347396850586, 26.911571502685547, 33.7896728515625, 40.66777038574219, 47.545867919921875, 54.42396545410156, 61.30206298828125, 68.18016052246094, 75.05825805664062, 81.93635559082031, 88.814453125, 95.69255065917969, 102.57064819335938, 109.44874572753906, 116.32684326171875, 123.20494079589844, 130.08303833007812, 136.9611358642578, 143.8392333984375, 150.7173309326172, 157.59542846679688, 164.47352600097656, 171.35162353515625, 178.229736328125, 185.1078338623047, 191.98593139648438, 198.86402893066406, 205.74212646484375, 212.62022399902344, 219.49832153320312, 226.3764190673828, 233.2545166015625, 240.1326141357422, 247.01071166992188, 253.88880920410156, 260.76690673828125, 267.64501953125, 274.5231018066406, 281.4012145996094, 288.279296875]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 7.0, 5.0, 12.0, 9.0, 10.0, 10.0, 20.0, 25.0, 9.0, 16.0, 26.0, 19.0, 25.0, 32.0, 40.0, 28.0, 41.0, 42.0, 36.0, 45.0, 40.0, 40.0, 36.0, 34.0, 39.0, 42.0, 33.0, 29.0, 27.0, 36.0, 20.0, 27.0, 23.0, 18.0, 18.0, 14.0, 8.0, 13.0, 11.0, 9.0, 8.0, 4.0, 6.0, 6.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-65.20747375488281, -63.1240234375, -61.04057312011719, -58.957122802734375, -56.8736686706543, -54.790218353271484, -52.70676803588867, -50.62331771850586, -48.53986358642578, -46.45641326904297, -44.372962951660156, -42.289512634277344, -40.206058502197266, -38.12260818481445, -36.03915786743164, -33.95570755004883, -31.872257232666016, -29.788806915283203, -27.705354690551758, -25.621904373168945, -23.5384521484375, -21.455001831054688, -19.371551513671875, -17.288101196289062, -15.204648971557617, -13.121197700500488, -11.03774642944336, -8.954296112060547, -6.870844841003418, -4.787393569946289, -2.7039432525634766, -0.6204919815063477, 1.4629592895507812, 3.546410322189331, 5.629861354827881, 7.713312149047852, 9.79676342010498, 11.88021469116211, 13.963665008544922, 16.047115325927734, 18.13056755065918, 20.214017868041992, 22.297470092773438, 24.38092041015625, 26.464370727539062, 28.547822952270508, 30.63127326965332, 32.714725494384766, 34.79817581176758, 36.88162612915039, 38.9650764465332, 41.04853057861328, 43.131980895996094, 45.215431213378906, 47.29888153076172, 49.38233184814453, 51.465782165527344, 53.549232482910156, 55.63268280029297, 57.71613311767578, 59.79958724975586, 61.88303756713867, 63.966487884521484, 66.04994201660156, 68.13339233398438]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 3.0, 5.0, 7.0, 5.0, 7.0, 5.0, 16.0, 14.0, 13.0, 14.0, 13.0, 21.0, 18.0, 25.0, 37.0, 26.0, 24.0, 41.0, 32.0, 31.0, 42.0, 47.0, 45.0, 49.0, 51.0, 42.0, 43.0, 37.0, 27.0, 35.0, 34.0, 25.0, 26.0, 17.0, 18.0, 21.0, 17.0, 14.0, 17.0, 9.0, 6.0, 5.0, 2.0, 9.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0], "bins": [-10.375, -10.085205078125, -9.79541015625, -9.505615234375, -9.2158203125, -8.926025390625, -8.63623046875, -8.346435546875, -8.056640625, -7.766845703125, -7.47705078125, -7.187255859375, -6.8974609375, -6.607666015625, -6.31787109375, -6.028076171875, -5.73828125, -5.448486328125, -5.15869140625, -4.868896484375, -4.5791015625, -4.289306640625, -3.99951171875, -3.709716796875, -3.419921875, -3.130126953125, -2.84033203125, -2.550537109375, -2.2607421875, -1.970947265625, -1.68115234375, -1.391357421875, -1.1015625, -0.811767578125, -0.52197265625, -0.232177734375, 0.0576171875, 0.347412109375, 0.63720703125, 0.927001953125, 1.216796875, 1.506591796875, 1.79638671875, 2.086181640625, 2.3759765625, 2.665771484375, 2.95556640625, 3.245361328125, 3.53515625, 3.824951171875, 4.11474609375, 4.404541015625, 4.6943359375, 4.984130859375, 5.27392578125, 5.563720703125, 5.853515625, 6.143310546875, 6.43310546875, 6.722900390625, 7.0126953125, 7.302490234375, 7.59228515625, 7.882080078125, 8.171875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 6.0, 4.0, 10.0, 14.0, 20.0, 25.0, 42.0, 72.0, 88.0, 129.0, 188.0, 327.0, 497.0, 747.0, 1119.0, 1762.0, 2568.0, 3867.0, 5786.0, 9041.0, 13290.0, 19871.0, 29675.0, 45765.0, 71796.0, 114046.0, 182441.0, 197268.0, 123555.0, 78405.0, 50117.0, 32502.0, 21442.0, 14371.0, 9249.0, 6104.0, 4169.0, 2805.0, 1818.0, 1197.0, 772.0, 532.0, 345.0, 228.0, 160.0, 110.0, 60.0, 50.0, 22.0, 31.0, 24.0, 8.0, 11.0, 4.0, 10.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.1983642578125, -0.1919841766357422, -0.18560409545898438, -0.17922401428222656, -0.17284393310546875, -0.16646385192871094, -0.16008377075195312, -0.1537036895751953, -0.1473236083984375, -0.1409435272216797, -0.13456344604492188, -0.12818336486816406, -0.12180328369140625, -0.11542320251464844, -0.10904312133789062, -0.10266304016113281, -0.096282958984375, -0.08990287780761719, -0.08352279663085938, -0.07714271545410156, -0.07076263427734375, -0.06438255310058594, -0.058002471923828125, -0.05162239074707031, -0.0452423095703125, -0.03886222839355469, -0.032482147216796875, -0.026102066040039062, -0.01972198486328125, -0.013341903686523438, -0.006961822509765625, -0.0005817413330078125, 0.00579833984375, 0.012178421020507812, 0.018558502197265625, 0.024938583374023438, 0.03131866455078125, 0.03769874572753906, 0.044078826904296875, 0.05045890808105469, 0.0568389892578125, 0.06321907043457031, 0.06959915161132812, 0.07597923278808594, 0.08235931396484375, 0.08873939514160156, 0.09511947631835938, 0.10149955749511719, 0.107879638671875, 0.11425971984863281, 0.12063980102539062, 0.12701988220214844, 0.13339996337890625, 0.13978004455566406, 0.14616012573242188, 0.1525402069091797, 0.1589202880859375, 0.1653003692626953, 0.17168045043945312, 0.17806053161621094, 0.18444061279296875, 0.19082069396972656, 0.19720077514648438, 0.2035808563232422, 0.2099609375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 1.0, 2.0, 7.0, 6.0, 10.0, 7.0, 7.0, 17.0, 12.0, 11.0, 22.0, 24.0, 22.0, 29.0, 27.0, 25.0, 28.0, 26.0, 36.0, 45.0, 32.0, 45.0, 45.0, 1062.0, 40.0, 26.0, 34.0, 38.0, 33.0, 25.0, 33.0, 31.0, 21.0, 26.0, 32.0, 22.0, 21.0, 12.0, 12.0, 14.0, 16.0, 5.0, 15.0, 2.0, 5.0, 6.0, 4.0, 3.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.625, -6.41632080078125, -6.2076416015625, -5.99896240234375, -5.790283203125, -5.58160400390625, -5.3729248046875, -5.16424560546875, -4.95556640625, -4.74688720703125, -4.5382080078125, -4.32952880859375, -4.120849609375, -3.91217041015625, -3.7034912109375, -3.49481201171875, -3.2861328125, -3.07745361328125, -2.8687744140625, -2.66009521484375, -2.451416015625, -2.24273681640625, -2.0340576171875, -1.82537841796875, -1.61669921875, -1.40802001953125, -1.1993408203125, -0.99066162109375, -0.781982421875, -0.57330322265625, -0.3646240234375, -0.15594482421875, 0.052734375, 0.26141357421875, 0.4700927734375, 0.67877197265625, 0.887451171875, 1.09613037109375, 1.3048095703125, 1.51348876953125, 1.72216796875, 1.93084716796875, 2.1395263671875, 2.34820556640625, 2.556884765625, 2.76556396484375, 2.9742431640625, 3.18292236328125, 3.3916015625, 3.60028076171875, 3.8089599609375, 4.01763916015625, 4.226318359375, 4.43499755859375, 4.6436767578125, 4.85235595703125, 5.06103515625, 5.26971435546875, 5.4783935546875, 5.68707275390625, 5.895751953125, 6.10443115234375, 6.3131103515625, 6.52178955078125, 6.73046875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 3.0, 8.0, 8.0, 13.0, 12.0, 23.0, 35.0, 37.0, 63.0, 95.0, 117.0, 174.0, 255.0, 344.0, 534.0, 687.0, 1041.0, 1453.0, 2057.0, 2982.0, 4537.0, 6308.0, 9226.0, 13232.0, 19364.0, 28493.0, 41017.0, 59968.0, 88889.0, 133187.0, 1227620.0, 146327.0, 98426.0, 66002.0, 44808.0, 31213.0, 21449.0, 14731.0, 9805.0, 6926.0, 4777.0, 3335.0, 2264.0, 1522.0, 1153.0, 769.0, 534.0, 372.0, 253.0, 214.0, 146.0, 82.0, 90.0, 55.0, 33.0, 29.0, 14.0, 13.0, 9.0, 4.0, 6.0, 3.0, 3.0], "bins": [-0.08935546875, -0.08652973175048828, -0.08370399475097656, -0.08087825775146484, -0.07805252075195312, -0.0752267837524414, -0.07240104675292969, -0.06957530975341797, -0.06674957275390625, -0.06392383575439453, -0.06109809875488281, -0.058272361755371094, -0.055446624755859375, -0.052620887756347656, -0.04979515075683594, -0.04696941375732422, -0.0441436767578125, -0.04131793975830078, -0.03849220275878906, -0.035666465759277344, -0.032840728759765625, -0.030014991760253906, -0.027189254760742188, -0.02436351776123047, -0.02153778076171875, -0.01871204376220703, -0.015886306762695312, -0.013060569763183594, -0.010234832763671875, -0.007409095764160156, -0.0045833587646484375, -0.0017576217651367188, 0.001068115234375, 0.0038938522338867188, 0.0067195892333984375, 0.009545326232910156, 0.012371063232421875, 0.015196800231933594, 0.018022537231445312, 0.02084827423095703, 0.02367401123046875, 0.02649974822998047, 0.029325485229492188, 0.032151222229003906, 0.034976959228515625, 0.037802696228027344, 0.04062843322753906, 0.04345417022705078, 0.0462799072265625, 0.04910564422607422, 0.05193138122558594, 0.054757118225097656, 0.057582855224609375, 0.060408592224121094, 0.06323432922363281, 0.06606006622314453, 0.06888580322265625, 0.07171154022216797, 0.07453727722167969, 0.0773630142211914, 0.08018875122070312, 0.08301448822021484, 0.08584022521972656, 0.08866596221923828, 0.09149169921875]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 7.0, 6.0, 9.0, 8.0, 13.0, 10.0, 16.0, 15.0, 18.0, 29.0, 35.0, 31.0, 40.0, 52.0, 44.0, 55.0, 49.0, 56.0, 55.0, 39.0, 40.0, 43.0, 43.0, 42.0, 42.0, 36.0, 21.0, 30.0, 19.0, 14.0, 17.0, 9.0, 8.0, 12.0, 7.0, 2.0, 8.0, 2.0, 4.0, 4.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.0010166168212890625, -0.0009859949350357056, -0.0009553730487823486, -0.0009247511625289917, -0.0008941292762756348, -0.0008635073900222778, -0.0008328855037689209, -0.000802263617515564, -0.000771641731262207, -0.0007410198450088501, -0.0007103979587554932, -0.0006797760725021362, -0.0006491541862487793, -0.0006185322999954224, -0.0005879104137420654, -0.0005572885274887085, -0.0005266666412353516, -0.0004960447549819946, -0.0004654228687286377, -0.00043480098247528076, -0.00040417909622192383, -0.0003735572099685669, -0.00034293532371520996, -0.00031231343746185303, -0.0002816915512084961, -0.00025106966495513916, -0.00022044777870178223, -0.0001898258924484253, -0.00015920400619506836, -0.00012858211994171143, -9.796023368835449e-05, -6.733834743499756e-05, -3.6716461181640625e-05, -6.094574928283691e-06, 2.4527311325073242e-05, 5.5149197578430176e-05, 8.577108383178711e-05, 0.00011639297008514404, 0.00014701485633850098, 0.0001776367425918579, 0.00020825862884521484, 0.00023888051509857178, 0.0002695024013519287, 0.00030012428760528564, 0.0003307461738586426, 0.0003613680601119995, 0.00039198994636535645, 0.0004226118326187134, 0.0004532337188720703, 0.00048385560512542725, 0.0005144774913787842, 0.0005450993776321411, 0.000575721263885498, 0.000606343150138855, 0.0006369650363922119, 0.0006675869226455688, 0.0006982088088989258, 0.0007288306951522827, 0.0007594525814056396, 0.0007900744676589966, 0.0008206963539123535, 0.0008513182401657104, 0.0008819401264190674, 0.0009125620126724243, 0.0009431838989257812]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 5.0, 3.0, 2.0, 7.0, 5.0, 7.0, 9.0, 14.0, 13.0, 14.0, 18.0, 22.0, 28.0, 35.0, 75.0, 103.0, 158.0, 244.0, 480.0, 1127.0, 28473.0, 1008390.0, 7349.0, 879.0, 402.0, 216.0, 134.0, 83.0, 58.0, 50.0, 32.0, 25.0, 22.0, 12.0, 9.0, 11.0, 10.0, 7.0, 5.0, 10.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0184173583984375, -0.017810821533203125, -0.01720428466796875, -0.016597747802734375, -0.0159912109375, -0.015384674072265625, -0.01477813720703125, -0.014171600341796875, -0.0135650634765625, -0.012958526611328125, -0.01235198974609375, -0.011745452880859375, -0.011138916015625, -0.010532379150390625, -0.00992584228515625, -0.009319305419921875, -0.0087127685546875, -0.008106231689453125, -0.00749969482421875, -0.006893157958984375, -0.00628662109375, -0.005680084228515625, -0.00507354736328125, -0.004467010498046875, -0.0038604736328125, -0.003253936767578125, -0.00264739990234375, -0.002040863037109375, -0.001434326171875, -0.000827789306640625, -0.00022125244140625, 0.000385284423828125, 0.0009918212890625, 0.001598358154296875, 0.00220489501953125, 0.002811431884765625, 0.00341796875, 0.004024505615234375, 0.00463104248046875, 0.005237579345703125, 0.0058441162109375, 0.006450653076171875, 0.00705718994140625, 0.007663726806640625, 0.008270263671875, 0.008876800537109375, 0.00948333740234375, 0.010089874267578125, 0.0106964111328125, 0.011302947998046875, 0.01190948486328125, 0.012516021728515625, 0.01312255859375, 0.013729095458984375, 0.01433563232421875, 0.014942169189453125, 0.0155487060546875, 0.016155242919921875, 0.01676177978515625, 0.017368316650390625, 0.017974853515625, 0.018581390380859375, 0.01918792724609375, 0.019794464111328125, 0.0204010009765625]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 353.0, 658.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03300518915057182, -0.032426510006189346, -0.03184782713651657, -0.031269147992134094, -0.03069046512246132, -0.030111784115433693, -0.029533103108406067, -0.02895442396402359, -0.028375741094350815, -0.02779706008732319, -0.027218379080295563, -0.026639698073267937, -0.02606101706624031, -0.025482336059212685, -0.02490365505218506, -0.024324975907802582, -0.023746294900774956, -0.02316761389374733, -0.022588932886719704, -0.022010251879692078, -0.02143157087266445, -0.020852889865636826, -0.0202742088586092, -0.019695527851581573, -0.019116848707199097, -0.01853816770017147, -0.017959486693143845, -0.01738080568611622, -0.016802124679088593, -0.016223443672060966, -0.01564476266503334, -0.015066082589328289, -0.014487400650978088, -0.013908719643950462, -0.013330038636922836, -0.01275135762989521, -0.012172676622867584, -0.011593995615839958, -0.011015315540134907, -0.01043663453310728, -0.009857953526079655, -0.009279272519052029, -0.008700591512024403, -0.008121910504996777, -0.007543229963630438, -0.006964548956602812, -0.006385868415236473, -0.005807187408208847, -0.005228506401181221, -0.004649825394153595, -0.004071144387125969, -0.00349246384575963, -0.002913782838732004, -0.002335101831704378, -0.0017564210575073957, -0.0011777402833104134, -0.0005990592762827873, -2.0378385670483112e-05, 0.0005583025049418211, 0.0011369833955541253, 0.0017156642861664295, 0.0022943452931940556, 0.002873026067391038, 0.0034517068415880203, 0.004030387848615646]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 5.0, 9.0, 12.0, 19.0, 19.0, 25.0, 21.0, 25.0, 35.0, 29.0, 41.0, 61.0, 56.0, 63.0, 64.0, 75.0, 64.0, 49.0, 62.0, 55.0, 37.0, 25.0, 27.0, 34.0, 18.0, 20.0, 16.0, 11.0, 4.0, 3.0, 4.0, 6.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001224815845489502, -0.0011795097962021828, -0.0011342037469148636, -0.0010888976976275444, -0.0010435916483402252, -0.000998285599052906, -0.0009529795497655869, -0.0009076735004782677, -0.0008623674511909485, -0.0008170614019036293, -0.0007717553526163101, -0.0007264493033289909, -0.0006811432540416718, -0.0006358372047543526, -0.0005905311554670334, -0.0005452251061797142, -0.000499919056892395, -0.00045461300760507584, -0.00040930695831775665, -0.00036400090903043747, -0.0003186948597431183, -0.0002733888104557991, -0.00022808276116847992, -0.00018277671188116074, -0.00013747066259384155, -9.216461330652237e-05, -4.6858564019203186e-05, -1.5525147318840027e-06, 4.375353455543518e-05, 8.905958384275436e-05, 0.00013436563313007355, 0.00017967168241739273, 0.00022497773170471191, 0.0002702837809920311, 0.0003155898302793503, 0.00036089587956666946, 0.00040620192885398865, 0.00045150797814130783, 0.000496814027428627, 0.0005421200767159462, 0.0005874261260032654, 0.0006327321752905846, 0.0006780382245779037, 0.0007233442738652229, 0.0007686503231525421, 0.0008139563724398613, 0.0008592624217271805, 0.0009045684710144997, 0.0009498745203018188, 0.000995180569589138, 0.0010404866188764572, 0.0010857926681637764, 0.0011310987174510956, 0.0011764047667384148, 0.001221710816025734, 0.0012670168653130531, 0.0013123229146003723, 0.0013576289638876915, 0.0014029350131750107, 0.0014482410624623299, 0.001493547111749649, 0.0015388531610369682, 0.0015841592103242874, 0.0016294652596116066, 0.0016747713088989258]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 3.0, 5.0, 7.0, 5.0, 7.0, 5.0, 16.0, 14.0, 13.0, 14.0, 13.0, 21.0, 18.0, 25.0, 37.0, 26.0, 24.0, 41.0, 32.0, 31.0, 42.0, 47.0, 45.0, 49.0, 51.0, 42.0, 43.0, 37.0, 27.0, 35.0, 34.0, 25.0, 26.0, 17.0, 18.0, 21.0, 17.0, 14.0, 17.0, 9.0, 6.0, 5.0, 2.0, 9.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0], "bins": [-10.375, -10.085205078125, -9.79541015625, -9.505615234375, -9.2158203125, -8.926025390625, -8.63623046875, -8.346435546875, -8.056640625, -7.766845703125, -7.47705078125, -7.187255859375, -6.8974609375, -6.607666015625, -6.31787109375, -6.028076171875, -5.73828125, -5.448486328125, -5.15869140625, -4.868896484375, -4.5791015625, -4.289306640625, -3.99951171875, -3.709716796875, -3.419921875, -3.130126953125, -2.84033203125, -2.550537109375, -2.2607421875, -1.970947265625, -1.68115234375, -1.391357421875, -1.1015625, -0.811767578125, -0.52197265625, -0.232177734375, 0.0576171875, 0.347412109375, 0.63720703125, 0.927001953125, 1.216796875, 1.506591796875, 1.79638671875, 2.086181640625, 2.3759765625, 2.665771484375, 2.95556640625, 3.245361328125, 3.53515625, 3.824951171875, 4.11474609375, 4.404541015625, 4.6943359375, 4.984130859375, 5.27392578125, 5.563720703125, 5.853515625, 6.143310546875, 6.43310546875, 6.722900390625, 7.0126953125, 7.302490234375, 7.59228515625, 7.882080078125, 8.171875]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 8.0, 11.0, 11.0, 9.0, 22.0, 26.0, 38.0, 46.0, 56.0, 117.0, 130.0, 179.0, 292.0, 352.0, 610.0, 869.0, 1427.0, 2291.0, 3905.0, 7545.0, 16775.0, 48818.0, 246793.0, 578209.0, 90315.0, 25894.0, 10732.0, 5056.0, 2949.0, 1746.0, 1094.0, 707.0, 445.0, 322.0, 222.0, 151.0, 124.0, 72.0, 55.0, 28.0, 38.0, 16.0, 11.0, 11.0, 12.0, 4.0, 6.0, 1.0, 3.0, 1.0, 1.0, 3.0], "bins": [-18.65625, -18.1265869140625, -17.596923828125, -17.0672607421875, -16.53759765625, -16.0079345703125, -15.478271484375, -14.9486083984375, -14.4189453125, -13.8892822265625, -13.359619140625, -12.8299560546875, -12.30029296875, -11.7706298828125, -11.240966796875, -10.7113037109375, -10.181640625, -9.6519775390625, -9.122314453125, -8.5926513671875, -8.06298828125, -7.5333251953125, -7.003662109375, -6.4739990234375, -5.9443359375, -5.4146728515625, -4.885009765625, -4.3553466796875, -3.82568359375, -3.2960205078125, -2.766357421875, -2.2366943359375, -1.70703125, -1.1773681640625, -0.647705078125, -0.1180419921875, 0.41162109375, 0.9412841796875, 1.470947265625, 2.0006103515625, 2.5302734375, 3.0599365234375, 3.589599609375, 4.1192626953125, 4.64892578125, 5.1785888671875, 5.708251953125, 6.2379150390625, 6.767578125, 7.2972412109375, 7.826904296875, 8.3565673828125, 8.88623046875, 9.4158935546875, 9.945556640625, 10.4752197265625, 11.0048828125, 11.5345458984375, 12.064208984375, 12.5938720703125, 13.12353515625, 13.6531982421875, 14.182861328125, 14.7125244140625, 15.2421875]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 8.0, 2.0, 4.0, 7.0, 10.0, 10.0, 12.0, 20.0, 15.0, 25.0, 33.0, 33.0, 38.0, 44.0, 54.0, 86.0, 106.0, 231.0, 1662.0, 180.0, 93.0, 72.0, 42.0, 55.0, 32.0, 36.0, 29.0, 22.0, 16.0, 19.0, 11.0, 15.0, 8.0, 4.0, 6.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.625, -36.29736328125, -34.9697265625, -33.64208984375, -32.314453125, -30.98681640625, -29.6591796875, -28.33154296875, -27.00390625, -25.67626953125, -24.3486328125, -23.02099609375, -21.693359375, -20.36572265625, -19.0380859375, -17.71044921875, -16.3828125, -15.05517578125, -13.7275390625, -12.39990234375, -11.072265625, -9.74462890625, -8.4169921875, -7.08935546875, -5.76171875, -4.43408203125, -3.1064453125, -1.77880859375, -0.451171875, 0.87646484375, 2.2041015625, 3.53173828125, 4.859375, 6.18701171875, 7.5146484375, 8.84228515625, 10.169921875, 11.49755859375, 12.8251953125, 14.15283203125, 15.48046875, 16.80810546875, 18.1357421875, 19.46337890625, 20.791015625, 22.11865234375, 23.4462890625, 24.77392578125, 26.1015625, 27.42919921875, 28.7568359375, 30.08447265625, 31.412109375, 32.73974609375, 34.0673828125, 35.39501953125, 36.72265625, 38.05029296875, 39.3779296875, 40.70556640625, 42.033203125, 43.36083984375, 44.6884765625, 46.01611328125, 47.34375]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 3.0, 3.0, 2.0, 4.0, 7.0, 6.0, 11.0, 15.0, 19.0, 27.0, 33.0, 52.0, 66.0, 73.0, 112.0, 198.0, 388.0, 1237.0, 9768.0, 761521.0, 2356929.0, 12689.0, 1465.0, 416.0, 170.0, 124.0, 96.0, 71.0, 39.0, 44.0, 34.0, 24.0, 17.0, 12.0, 7.0, 4.0, 6.0, 11.0, 6.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-84.8125, -82.4599609375, -80.107421875, -77.7548828125, -75.40234375, -73.0498046875, -70.697265625, -68.3447265625, -65.9921875, -63.6396484375, -61.287109375, -58.9345703125, -56.58203125, -54.2294921875, -51.876953125, -49.5244140625, -47.171875, -44.8193359375, -42.466796875, -40.1142578125, -37.76171875, -35.4091796875, -33.056640625, -30.7041015625, -28.3515625, -25.9990234375, -23.646484375, -21.2939453125, -18.94140625, -16.5888671875, -14.236328125, -11.8837890625, -9.53125, -7.1787109375, -4.826171875, -2.4736328125, -0.12109375, 2.2314453125, 4.583984375, 6.9365234375, 9.2890625, 11.6416015625, 13.994140625, 16.3466796875, 18.69921875, 21.0517578125, 23.404296875, 25.7568359375, 28.109375, 30.4619140625, 32.814453125, 35.1669921875, 37.51953125, 39.8720703125, 42.224609375, 44.5771484375, 46.9296875, 49.2822265625, 51.634765625, 53.9873046875, 56.33984375, 58.6923828125, 61.044921875, 63.3974609375, 65.75]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 266.0, 751.0], "bins": [-1739.109375, -1711.553466796875, -1683.9976806640625, -1656.4417724609375, -1628.8858642578125, -1601.3299560546875, -1573.774169921875, -1546.21826171875, -1518.662353515625, -1491.1064453125, -1463.5506591796875, -1435.9947509765625, -1408.4388427734375, -1380.8829345703125, -1353.3271484375, -1325.771240234375, -1298.21533203125, -1270.659423828125, -1243.1036376953125, -1215.5477294921875, -1187.9918212890625, -1160.4359130859375, -1132.880126953125, -1105.32421875, -1077.7684326171875, -1050.2125244140625, -1022.6566772460938, -995.100830078125, -967.544921875, -939.9890747070312, -912.4332275390625, -884.8773193359375, -857.3213500976562, -829.7655029296875, -802.2095947265625, -774.6537475585938, -747.0978393554688, -719.5419921875, -691.986083984375, -664.4302368164062, -636.8743896484375, -609.3185424804688, -581.7626342773438, -554.206787109375, -526.65087890625, -499.09503173828125, -471.5391540527344, -443.9832763671875, -416.4273986816406, -388.87152099609375, -361.3156433105469, -333.759765625, -306.20391845703125, -278.64801025390625, -251.0921630859375, -223.53628540039062, -195.9803924560547, -168.4245147705078, -140.86865234375, -113.31277465820312, -85.75689697265625, -58.201019287109375, -30.645156860351562, -3.0892791748046875, 24.466596603393555]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 4.0, 6.0, 3.0, 11.0, 7.0, 7.0, 12.0, 10.0, 10.0, 10.0, 22.0, 16.0, 32.0, 28.0, 36.0, 34.0, 44.0, 38.0, 36.0, 48.0, 30.0, 39.0, 49.0, 37.0, 42.0, 38.0, 37.0, 40.0, 36.0, 36.0, 25.0, 37.0, 19.0, 21.0, 17.0, 16.0, 12.0, 12.0, 10.0, 10.0, 15.0, 3.0, 4.0, 1.0, 1.0, 1.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-83.80767822265625, -81.05241394042969, -78.29714965820312, -75.5418930053711, -72.78662872314453, -70.03136444091797, -67.27610778808594, -64.52084350585938, -61.76557922363281, -59.01031494140625, -56.25505447387695, -53.499794006347656, -50.744529724121094, -47.98926544189453, -45.234004974365234, -42.47874450683594, -39.723480224609375, -36.96821594238281, -34.212955474853516, -31.457693099975586, -28.702430725097656, -25.947168350219727, -23.191905975341797, -20.436643600463867, -17.681381225585938, -14.926118850708008, -12.170856475830078, -9.415594100952148, -6.660331726074219, -3.905069351196289, -1.1498069763183594, 1.6054553985595703, 4.3607177734375, 7.11598014831543, 9.87124252319336, 12.626504898071289, 15.381767272949219, 18.13702964782715, 20.892292022705078, 23.647554397583008, 26.402816772460938, 29.158079147338867, 31.913341522216797, 34.668601989746094, 37.423866271972656, 40.17913055419922, 42.934391021728516, 45.68965148925781, 48.444915771484375, 51.20018005371094, 53.955440521240234, 56.71070098876953, 59.465965270996094, 62.221229553222656, 64.97648620605469, 67.73175048828125, 70.48701477050781, 73.24227905273438, 75.99754333496094, 78.75279998779297, 81.50806427001953, 84.2633285522461, 87.01858520507812, 89.77384948730469, 92.52911376953125]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 5.0, 10.0, 2.0, 3.0, 6.0, 11.0, 11.0, 9.0, 16.0, 16.0, 20.0, 17.0, 20.0, 32.0, 23.0, 32.0, 29.0, 40.0, 31.0, 42.0, 50.0, 53.0, 41.0, 42.0, 46.0, 46.0, 49.0, 42.0, 31.0, 28.0, 30.0, 27.0, 17.0, 17.0, 20.0, 16.0, 15.0, 19.0, 11.0, 6.0, 8.0, 4.0, 6.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.8046875, -11.4803466796875, -11.156005859375, -10.8316650390625, -10.50732421875, -10.1829833984375, -9.858642578125, -9.5343017578125, -9.2099609375, -8.8856201171875, -8.561279296875, -8.2369384765625, -7.91259765625, -7.5882568359375, -7.263916015625, -6.9395751953125, -6.615234375, -6.2908935546875, -5.966552734375, -5.6422119140625, -5.31787109375, -4.9935302734375, -4.669189453125, -4.3448486328125, -4.0205078125, -3.6961669921875, -3.371826171875, -3.0474853515625, -2.72314453125, -2.3988037109375, -2.074462890625, -1.7501220703125, -1.42578125, -1.1014404296875, -0.777099609375, -0.4527587890625, -0.12841796875, 0.1959228515625, 0.520263671875, 0.8446044921875, 1.1689453125, 1.4932861328125, 1.817626953125, 2.1419677734375, 2.46630859375, 2.7906494140625, 3.114990234375, 3.4393310546875, 3.763671875, 4.0880126953125, 4.412353515625, 4.7366943359375, 5.06103515625, 5.3853759765625, 5.709716796875, 6.0340576171875, 6.3583984375, 6.6827392578125, 7.007080078125, 7.3314208984375, 7.65576171875, 7.9801025390625, 8.304443359375, 8.6287841796875, 8.953125]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 4.0, 8.0, 7.0, 7.0, 5.0, 12.0, 10.0, 21.0, 24.0, 27.0, 33.0, 46.0, 66.0, 96.0, 192.0, 257.0, 472.0, 994.0, 2276.0, 5838.0, 18281.0, 221331.0, 3653669.0, 261517.0, 19055.0, 5786.0, 2169.0, 935.0, 429.0, 262.0, 119.0, 85.0, 62.0, 47.0, 28.0, 30.0, 17.0, 26.0, 15.0, 8.0, 3.0, 6.0, 6.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.40625, -46.10791015625, -44.8095703125, -43.51123046875, -42.212890625, -40.91455078125, -39.6162109375, -38.31787109375, -37.01953125, -35.72119140625, -34.4228515625, -33.12451171875, -31.826171875, -30.52783203125, -29.2294921875, -27.93115234375, -26.6328125, -25.33447265625, -24.0361328125, -22.73779296875, -21.439453125, -20.14111328125, -18.8427734375, -17.54443359375, -16.24609375, -14.94775390625, -13.6494140625, -12.35107421875, -11.052734375, -9.75439453125, -8.4560546875, -7.15771484375, -5.859375, -4.56103515625, -3.2626953125, -1.96435546875, -0.666015625, 0.63232421875, 1.9306640625, 3.22900390625, 4.52734375, 5.82568359375, 7.1240234375, 8.42236328125, 9.720703125, 11.01904296875, 12.3173828125, 13.61572265625, 14.9140625, 16.21240234375, 17.5107421875, 18.80908203125, 20.107421875, 21.40576171875, 22.7041015625, 24.00244140625, 25.30078125, 26.59912109375, 27.8974609375, 29.19580078125, 30.494140625, 31.79248046875, 33.0908203125, 34.38916015625, 35.6875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 2.0, 3.0, 6.0, 11.0, 6.0, 16.0, 11.0, 18.0, 22.0, 30.0, 37.0, 56.0, 95.0, 166.0, 329.0, 648.0, 833.0, 773.0, 420.0, 222.0, 125.0, 61.0, 41.0, 36.0, 20.0, 19.0, 21.0, 19.0, 8.0, 7.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.09375, -33.166015625, -32.23828125, -31.310546875, -30.3828125, -29.455078125, -28.52734375, -27.599609375, -26.671875, -25.744140625, -24.81640625, -23.888671875, -22.9609375, -22.033203125, -21.10546875, -20.177734375, -19.25, -18.322265625, -17.39453125, -16.466796875, -15.5390625, -14.611328125, -13.68359375, -12.755859375, -11.828125, -10.900390625, -9.97265625, -9.044921875, -8.1171875, -7.189453125, -6.26171875, -5.333984375, -4.40625, -3.478515625, -2.55078125, -1.623046875, -0.6953125, 0.232421875, 1.16015625, 2.087890625, 3.015625, 3.943359375, 4.87109375, 5.798828125, 6.7265625, 7.654296875, 8.58203125, 9.509765625, 10.4375, 11.365234375, 12.29296875, 13.220703125, 14.1484375, 15.076171875, 16.00390625, 16.931640625, 17.859375, 18.787109375, 19.71484375, 20.642578125, 21.5703125, 22.498046875, 23.42578125, 24.353515625, 25.28125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 5.0, 12.0, 18.0, 31.0, 28.0, 48.0, 96.0, 175.0, 447.0, 1269.0, 4109.0, 18060.0, 158441.0, 3820213.0, 166582.0, 18326.0, 4249.0, 1276.0, 438.0, 178.0, 105.0, 51.0, 22.0, 19.0, 20.0, 19.0, 7.0, 11.0, 3.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.59375, -53.57275390625, -51.5517578125, -49.53076171875, -47.509765625, -45.48876953125, -43.4677734375, -41.44677734375, -39.42578125, -37.40478515625, -35.3837890625, -33.36279296875, -31.341796875, -29.32080078125, -27.2998046875, -25.27880859375, -23.2578125, -21.23681640625, -19.2158203125, -17.19482421875, -15.173828125, -13.15283203125, -11.1318359375, -9.11083984375, -7.08984375, -5.06884765625, -3.0478515625, -1.02685546875, 0.994140625, 3.01513671875, 5.0361328125, 7.05712890625, 9.078125, 11.09912109375, 13.1201171875, 15.14111328125, 17.162109375, 19.18310546875, 21.2041015625, 23.22509765625, 25.24609375, 27.26708984375, 29.2880859375, 31.30908203125, 33.330078125, 35.35107421875, 37.3720703125, 39.39306640625, 41.4140625, 43.43505859375, 45.4560546875, 47.47705078125, 49.498046875, 51.51904296875, 53.5400390625, 55.56103515625, 57.58203125, 59.60302734375, 61.6240234375, 63.64501953125, 65.666015625, 67.68701171875, 69.7080078125, 71.72900390625, 73.75]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 2.0, 6.0, 7.0, 8.0, 12.0, 30.0, 25.0, 35.0, 64.0, 82.0, 110.0, 143.0, 130.0, 110.0, 88.0, 49.0, 40.0, 22.0, 22.0, 12.0, 4.0, 2.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.06134033203125, -50.48974609375, -46.91815185546875, -43.346561431884766, -39.774967193603516, -36.203372955322266, -32.63178253173828, -29.06018829345703, -25.48859405517578, -21.91699981689453, -18.345407485961914, -14.77381420135498, -11.202220916748047, -7.630626678466797, -4.05903434753418, -0.4874420166015625, 3.0841522216796875, 6.655745506286621, 10.227338790893555, 13.798932075500488, 17.370525360107422, 20.942119598388672, 24.51371192932129, 28.085304260253906, 31.656898498535156, 35.228492736816406, 38.800086975097656, 42.37167739868164, 45.94327163696289, 49.51486587524414, 53.086456298828125, 56.658050537109375, 60.229644775390625, 63.801239013671875, 67.37283325195312, 70.94442749023438, 74.51602172851562, 78.08761596679688, 81.6592025756836, 85.23079681396484, 88.8023910522461, 92.37398529052734, 95.9455795288086, 99.51717376708984, 103.08876037597656, 106.66035461425781, 110.23194885253906, 113.80354309082031, 117.37513732910156, 120.94673156738281, 124.51832580566406, 128.0899200439453, 131.66151428222656, 135.2331085205078, 138.80470275878906, 142.37628173828125, 145.9478759765625, 149.51947021484375, 153.091064453125, 156.66265869140625, 160.2342529296875, 163.80584716796875, 167.37744140625, 170.94903564453125, 174.5206298828125]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 5.0, 4.0, 3.0, 5.0, 9.0, 12.0, 17.0, 18.0, 20.0, 13.0, 20.0, 16.0, 26.0, 24.0, 23.0, 22.0, 31.0, 40.0, 40.0, 34.0, 36.0, 35.0, 41.0, 36.0, 41.0, 40.0, 34.0, 50.0, 34.0, 34.0, 34.0, 29.0, 18.0, 14.0, 24.0, 19.0, 9.0, 19.0, 18.0, 9.0, 7.0, 5.0, 6.0, 4.0, 6.0, 5.0, 4.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-70.21063995361328, -68.07457733154297, -65.93851470947266, -63.802452087402344, -61.6663932800293, -59.530330657958984, -57.39426803588867, -55.25820541381836, -53.12214660644531, -50.986083984375, -48.85002136230469, -46.713958740234375, -44.57789993286133, -42.441837310791016, -40.3057746887207, -38.16971206665039, -36.03364944458008, -33.897586822509766, -31.761526107788086, -29.625463485717773, -27.489402770996094, -25.35334014892578, -23.21727752685547, -21.081214904785156, -18.945154190063477, -16.809091567993164, -14.673030853271484, -12.536968231201172, -10.400906562805176, -8.26484489440918, -6.128782272338867, -3.992720603942871, -1.856658935546875, 0.2794029712677002, 2.4154648780822754, 4.55152702331543, 6.687588691711426, 8.823650360107422, 10.959712982177734, 13.09577465057373, 15.231836318969727, 17.36789894104004, 19.50395965576172, 21.64002227783203, 23.776084899902344, 25.912145614624023, 28.048208236694336, 30.184268951416016, 32.32033157348633, 34.45639419555664, 36.59245681762695, 38.728515625, 40.86457824707031, 43.000640869140625, 45.13670349121094, 47.27276611328125, 49.40882873535156, 51.544891357421875, 53.68095397949219, 55.8170166015625, 57.95307540893555, 60.08913803100586, 62.22520065307617, 64.36125946044922, 66.49732208251953]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 8.0, 5.0, 3.0, 5.0, 6.0, 5.0, 6.0, 14.0, 6.0, 14.0, 17.0, 19.0, 25.0, 20.0, 27.0, 24.0, 30.0, 23.0, 32.0, 36.0, 32.0, 42.0, 41.0, 48.0, 37.0, 35.0, 42.0, 37.0, 30.0, 37.0, 38.0, 41.0, 31.0, 28.0, 25.0, 18.0, 16.0, 13.0, 9.0, 21.0, 12.0, 6.0, 13.0, 9.0, 7.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-10.234375, -9.9442138671875, -9.654052734375, -9.3638916015625, -9.07373046875, -8.7835693359375, -8.493408203125, -8.2032470703125, -7.9130859375, -7.6229248046875, -7.332763671875, -7.0426025390625, -6.75244140625, -6.4622802734375, -6.172119140625, -5.8819580078125, -5.591796875, -5.3016357421875, -5.011474609375, -4.7213134765625, -4.43115234375, -4.1409912109375, -3.850830078125, -3.5606689453125, -3.2705078125, -2.9803466796875, -2.690185546875, -2.4000244140625, -2.10986328125, -1.8197021484375, -1.529541015625, -1.2393798828125, -0.94921875, -0.6590576171875, -0.368896484375, -0.0787353515625, 0.21142578125, 0.5015869140625, 0.791748046875, 1.0819091796875, 1.3720703125, 1.6622314453125, 1.952392578125, 2.2425537109375, 2.53271484375, 2.8228759765625, 3.113037109375, 3.4031982421875, 3.693359375, 3.9835205078125, 4.273681640625, 4.5638427734375, 4.85400390625, 5.1441650390625, 5.434326171875, 5.7244873046875, 6.0146484375, 6.3048095703125, 6.594970703125, 6.8851318359375, 7.17529296875, 7.4654541015625, 7.755615234375, 8.0457763671875, 8.3359375]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 8.0, 15.0, 18.0, 30.0, 42.0, 77.0, 97.0, 165.0, 222.0, 309.0, 433.0, 668.0, 907.0, 1284.0, 1815.0, 2550.0, 3673.0, 5007.0, 7467.0, 10665.0, 15277.0, 22079.0, 32237.0, 48584.0, 73283.0, 114971.0, 178679.0, 180405.0, 116513.0, 74597.0, 49311.0, 33248.0, 22388.0, 15369.0, 10885.0, 7527.0, 5285.0, 3703.0, 2666.0, 1840.0, 1258.0, 956.0, 685.0, 436.0, 307.0, 197.0, 125.0, 120.0, 76.0, 39.0, 14.0, 14.0, 19.0, 9.0, 6.0, 2.0, 3.0], "bins": [-0.211669921875, -0.20544815063476562, -0.19922637939453125, -0.19300460815429688, -0.1867828369140625, -0.18056106567382812, -0.17433929443359375, -0.16811752319335938, -0.161895751953125, -0.15567398071289062, -0.14945220947265625, -0.14323043823242188, -0.1370086669921875, -0.13078689575195312, -0.12456512451171875, -0.11834335327148438, -0.11212158203125, -0.10589981079101562, -0.09967803955078125, -0.09345626831054688, -0.0872344970703125, -0.08101272583007812, -0.07479095458984375, -0.06856918334960938, -0.062347412109375, -0.056125640869140625, -0.04990386962890625, -0.043682098388671875, -0.0374603271484375, -0.031238555908203125, -0.02501678466796875, -0.018795013427734375, -0.0125732421875, -0.006351470947265625, -0.00012969970703125, 0.006092071533203125, 0.0123138427734375, 0.018535614013671875, 0.02475738525390625, 0.030979156494140625, 0.037200927734375, 0.043422698974609375, 0.04964447021484375, 0.055866241455078125, 0.0620880126953125, 0.06830978393554688, 0.07453155517578125, 0.08075332641601562, 0.08697509765625, 0.09319686889648438, 0.09941864013671875, 0.10564041137695312, 0.1118621826171875, 0.11808395385742188, 0.12430572509765625, 0.13052749633789062, 0.136749267578125, 0.14297103881835938, 0.14919281005859375, 0.15541458129882812, 0.1616363525390625, 0.16785812377929688, 0.17407989501953125, 0.18030166625976562, 0.1865234375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 6.0, 5.0, 6.0, 8.0, 8.0, 13.0, 14.0, 15.0, 19.0, 25.0, 28.0, 28.0, 31.0, 42.0, 29.0, 34.0, 38.0, 44.0, 39.0, 39.0, 1077.0, 47.0, 45.0, 42.0, 42.0, 43.0, 28.0, 33.0, 30.0, 21.0, 28.0, 18.0, 13.0, 11.0, 15.0, 14.0, 7.0, 13.0, 6.0, 5.0, 4.0, 6.0, 2.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.234375, -6.9774169921875, -6.720458984375, -6.4635009765625, -6.20654296875, -5.9495849609375, -5.692626953125, -5.4356689453125, -5.1787109375, -4.9217529296875, -4.664794921875, -4.4078369140625, -4.15087890625, -3.8939208984375, -3.636962890625, -3.3800048828125, -3.123046875, -2.8660888671875, -2.609130859375, -2.3521728515625, -2.09521484375, -1.8382568359375, -1.581298828125, -1.3243408203125, -1.0673828125, -0.8104248046875, -0.553466796875, -0.2965087890625, -0.03955078125, 0.2174072265625, 0.474365234375, 0.7313232421875, 0.98828125, 1.2452392578125, 1.502197265625, 1.7591552734375, 2.01611328125, 2.2730712890625, 2.530029296875, 2.7869873046875, 3.0439453125, 3.3009033203125, 3.557861328125, 3.8148193359375, 4.07177734375, 4.3287353515625, 4.585693359375, 4.8426513671875, 5.099609375, 5.3565673828125, 5.613525390625, 5.8704833984375, 6.12744140625, 6.3843994140625, 6.641357421875, 6.8983154296875, 7.1552734375, 7.4122314453125, 7.669189453125, 7.9261474609375, 8.18310546875, 8.4400634765625, 8.697021484375, 8.9539794921875, 9.2109375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 4.0, 5.0, 7.0, 14.0, 21.0, 25.0, 42.0, 67.0, 91.0, 125.0, 213.0, 281.0, 399.0, 617.0, 870.0, 1297.0, 1905.0, 2792.0, 4256.0, 6508.0, 9810.0, 14706.0, 22952.0, 35822.0, 55471.0, 91191.0, 152594.0, 1269645.0, 161718.0, 96723.0, 59217.0, 37749.0, 24023.0, 15623.0, 10245.0, 6714.0, 4399.0, 2856.0, 1891.0, 1326.0, 871.0, 654.0, 427.0, 301.0, 211.0, 150.0, 111.0, 64.0, 43.0, 40.0, 15.0, 16.0, 7.0, 5.0, 4.0, 1.0, 5.0, 1.0, 0.0, 3.0, 4.0], "bins": [-0.110107421875, -0.10650444030761719, -0.10290145874023438, -0.09929847717285156, -0.09569549560546875, -0.09209251403808594, -0.08848953247070312, -0.08488655090332031, -0.0812835693359375, -0.07768058776855469, -0.07407760620117188, -0.07047462463378906, -0.06687164306640625, -0.06326866149902344, -0.059665679931640625, -0.05606269836425781, -0.052459716796875, -0.04885673522949219, -0.045253753662109375, -0.04165077209472656, -0.03804779052734375, -0.03444480895996094, -0.030841827392578125, -0.027238845825195312, -0.0236358642578125, -0.020032882690429688, -0.016429901123046875, -0.012826919555664062, -0.00922393798828125, -0.0056209564208984375, -0.002017974853515625, 0.0015850067138671875, 0.00518798828125, 0.008790969848632812, 0.012393951416015625, 0.015996932983398438, 0.01959991455078125, 0.023202896118164062, 0.026805877685546875, 0.030408859252929688, 0.0340118408203125, 0.03761482238769531, 0.041217803955078125, 0.04482078552246094, 0.04842376708984375, 0.05202674865722656, 0.055629730224609375, 0.05923271179199219, 0.062835693359375, 0.06643867492675781, 0.07004165649414062, 0.07364463806152344, 0.07724761962890625, 0.08085060119628906, 0.08445358276367188, 0.08805656433105469, 0.0916595458984375, 0.09526252746582031, 0.09886550903320312, 0.10246849060058594, 0.10607147216796875, 0.10967445373535156, 0.11327743530273438, 0.11688041687011719, 0.1204833984375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 13.0, 10.0, 9.0, 14.0, 15.0, 16.0, 15.0, 35.0, 36.0, 50.0, 39.0, 72.0, 73.0, 74.0, 76.0, 68.0, 68.0, 55.0, 54.0, 45.0, 27.0, 28.0, 20.0, 17.0, 18.0, 11.0, 9.0, 3.0, 7.0, 2.0, 3.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0013179779052734375, -0.0012768656015396118, -0.0012357532978057861, -0.0011946409940719604, -0.0011535286903381348, -0.001112416386604309, -0.0010713040828704834, -0.0010301917791366577, -0.000989079475402832, -0.0009479671716690063, -0.0009068548679351807, -0.000865742564201355, -0.0008246302604675293, -0.0007835179567337036, -0.0007424056529998779, -0.0007012933492660522, -0.0006601810455322266, -0.0006190687417984009, -0.0005779564380645752, -0.0005368441343307495, -0.0004957318305969238, -0.00045461952686309814, -0.00041350722312927246, -0.0003723949193954468, -0.0003312826156616211, -0.0002901703119277954, -0.0002490580081939697, -0.00020794570446014404, -0.00016683340072631836, -0.00012572109699249268, -8.460879325866699e-05, -4.349648952484131e-05, -2.384185791015625e-06, 3.872811794281006e-05, 7.984042167663574e-05, 0.00012095272541046143, 0.0001620650291442871, 0.0002031773328781128, 0.0002442896366119385, 0.00028540194034576416, 0.00032651424407958984, 0.00036762654781341553, 0.0004087388515472412, 0.0004498511552810669, 0.0004909634590148926, 0.0005320757627487183, 0.0005731880664825439, 0.0006143003702163696, 0.0006554126739501953, 0.000696524977684021, 0.0007376372814178467, 0.0007787495851516724, 0.000819861888885498, 0.0008609741926193237, 0.0009020864963531494, 0.0009431988000869751, 0.0009843111038208008, 0.0010254234075546265, 0.0010665357112884521, 0.0011076480150222778, 0.0011487603187561035, 0.0011898726224899292, 0.0012309849262237549, 0.0012720972299575806, 0.0013132095336914062]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 2.0, 6.0, 3.0, 10.0, 10.0, 14.0, 21.0, 23.0, 34.0, 35.0, 66.0, 116.0, 206.0, 445.0, 1739.0, 931753.0, 112000.0, 1200.0, 391.0, 164.0, 77.0, 75.0, 40.0, 18.0, 23.0, 15.0, 15.0, 9.0, 10.0, 11.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.027862548828125, -0.026988983154296875, -0.02611541748046875, -0.025241851806640625, -0.0243682861328125, -0.023494720458984375, -0.02262115478515625, -0.021747589111328125, -0.0208740234375, -0.020000457763671875, -0.01912689208984375, -0.018253326416015625, -0.0173797607421875, -0.016506195068359375, -0.01563262939453125, -0.014759063720703125, -0.013885498046875, -0.013011932373046875, -0.01213836669921875, -0.011264801025390625, -0.0103912353515625, -0.009517669677734375, -0.00864410400390625, -0.007770538330078125, -0.00689697265625, -0.006023406982421875, -0.00514984130859375, -0.004276275634765625, -0.0034027099609375, -0.002529144287109375, -0.00165557861328125, -0.000782012939453125, 9.1552734375e-05, 0.000965118408203125, 0.00183868408203125, 0.002712249755859375, 0.0035858154296875, 0.004459381103515625, 0.00533294677734375, 0.006206512451171875, 0.007080078125, 0.007953643798828125, 0.00882720947265625, 0.009700775146484375, 0.0105743408203125, 0.011447906494140625, 0.01232147216796875, 0.013195037841796875, 0.014068603515625, 0.014942169189453125, 0.01581573486328125, 0.016689300537109375, 0.0175628662109375, 0.018436431884765625, 0.01930999755859375, 0.020183563232421875, 0.02105712890625, 0.021930694580078125, 0.02280426025390625, 0.023677825927734375, 0.0245513916015625, 0.025424957275390625, 0.02629852294921875, 0.027172088623046875, 0.028045654296875]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 28.0, 967.0, 18.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03016747534275055, -0.02961399033665657, -0.029060503467917442, -0.028507018461823463, -0.027953531593084335, -0.027400046586990356, -0.02684655971825123, -0.02629307471215725, -0.02573958784341812, -0.025186102837324142, -0.024632615968585014, -0.024079130962491035, -0.023525644093751907, -0.02297215908765793, -0.0224186722189188, -0.02186518721282482, -0.021311702206730843, -0.020758217200636864, -0.020204730331897736, -0.019651245325803757, -0.01909775845706463, -0.01854427345097065, -0.01799078658223152, -0.017437301576137543, -0.016883816570043564, -0.016330331563949585, -0.015776844695210457, -0.015223358757793903, -0.01466987282037735, -0.014116387814283371, -0.013562901876866817, -0.013009415939450264, -0.012455929070711136, -0.011902443133294582, -0.011348957195878029, -0.010795471258461475, -0.010241985321044922, -0.009688500314950943, -0.00913501437753439, -0.008581528440117836, -0.008028042502701283, -0.007474556565284729, -0.0069210706278681755, -0.006367585156112909, -0.005814099218696356, -0.005260613281279802, -0.004707127809524536, -0.004153641872107983, -0.003600155934691429, -0.0030466699972748756, -0.002493184292688966, -0.0019396984716877341, -0.0013862126506865025, -0.000832726713269949, -0.0002792410086840391, 0.00027424469590187073, 0.0008277306333184242, 0.001381216454319656, 0.0019347022753208876, 0.0024881879799067974, 0.003041673917323351, 0.0035951598547399044, 0.004148645326495171, 0.004702131263911724, 0.005255617201328278]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 5.0, 2.0, 0.0, 5.0, 1.0, 3.0, 2.0, 6.0, 9.0, 6.0, 8.0, 8.0, 17.0, 21.0, 17.0, 25.0, 25.0, 28.0, 37.0, 47.0, 36.0, 37.0, 41.0, 44.0, 36.0, 47.0, 44.0, 53.0, 50.0, 39.0, 50.0, 28.0, 41.0, 26.0, 26.0, 27.0, 25.0, 15.0, 18.0, 10.0, 15.0, 14.0, 5.0, 5.0, 2.0, 2.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0010303258895874023, -0.0009916974231600761, -0.0009530689567327499, -0.0009144404903054237, -0.0008758120238780975, -0.0008371835574507713, -0.0007985550910234451, -0.0007599266245961189, -0.0007212981581687927, -0.0006826696917414665, -0.0006440412253141403, -0.0006054127588868141, -0.0005667842924594879, -0.0005281558260321617, -0.0004895273596048355, -0.0004508988931775093, -0.0004122704267501831, -0.0003736419603228569, -0.0003350134938955307, -0.0002963850274682045, -0.0002577565610408783, -0.0002191280946135521, -0.0001804996281862259, -0.0001418711617588997, -0.00010324269533157349, -6.461422890424728e-05, -2.598576247692108e-05, 1.2642703950405121e-05, 5.127117037773132e-05, 8.989963680505753e-05, 0.00012852810323238373, 0.00016715656965970993, 0.00020578503608703613, 0.00024441350251436234, 0.00028304196894168854, 0.00032167043536901474, 0.00036029890179634094, 0.00039892736822366714, 0.00043755583465099335, 0.00047618430107831955, 0.0005148127675056458, 0.000553441233932972, 0.0005920697003602982, 0.0006306981667876244, 0.0006693266332149506, 0.0007079550996422768, 0.000746583566069603, 0.0007852120324969292, 0.0008238404989242554, 0.0008624689653515816, 0.0009010974317789078, 0.000939725898206234, 0.0009783543646335602, 0.0010169828310608864, 0.0010556112974882126, 0.0010942397639155388, 0.001132868230342865, 0.0011714966967701912, 0.0012101251631975174, 0.0012487536296248436, 0.0012873820960521698, 0.001326010562479496, 0.0013646390289068222, 0.0014032674953341484, 0.0014418959617614746]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 8.0, 5.0, 3.0, 5.0, 6.0, 5.0, 6.0, 14.0, 6.0, 14.0, 17.0, 19.0, 25.0, 20.0, 27.0, 24.0, 30.0, 23.0, 32.0, 36.0, 32.0, 42.0, 41.0, 48.0, 37.0, 35.0, 42.0, 37.0, 30.0, 37.0, 38.0, 41.0, 31.0, 28.0, 25.0, 18.0, 16.0, 13.0, 9.0, 21.0, 12.0, 6.0, 13.0, 9.0, 7.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-10.234375, -9.9442138671875, -9.654052734375, -9.3638916015625, -9.07373046875, -8.7835693359375, -8.493408203125, -8.2032470703125, -7.9130859375, -7.6229248046875, -7.332763671875, -7.0426025390625, -6.75244140625, -6.4622802734375, -6.172119140625, -5.8819580078125, -5.591796875, -5.3016357421875, -5.011474609375, -4.7213134765625, -4.43115234375, -4.1409912109375, -3.850830078125, -3.5606689453125, -3.2705078125, -2.9803466796875, -2.690185546875, -2.4000244140625, -2.10986328125, -1.8197021484375, -1.529541015625, -1.2393798828125, -0.94921875, -0.6590576171875, -0.368896484375, -0.0787353515625, 0.21142578125, 0.5015869140625, 0.791748046875, 1.0819091796875, 1.3720703125, 1.6622314453125, 1.952392578125, 2.2425537109375, 2.53271484375, 2.8228759765625, 3.113037109375, 3.4031982421875, 3.693359375, 3.9835205078125, 4.273681640625, 4.5638427734375, 4.85400390625, 5.1441650390625, 5.434326171875, 5.7244873046875, 6.0146484375, 6.3048095703125, 6.594970703125, 6.8851318359375, 7.17529296875, 7.4654541015625, 7.755615234375, 8.0457763671875, 8.3359375]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 10.0, 18.0, 20.0, 27.0, 33.0, 52.0, 66.0, 106.0, 152.0, 215.0, 267.0, 434.0, 598.0, 917.0, 1269.0, 2167.0, 3378.0, 5230.0, 8896.0, 16607.0, 39525.0, 225401.0, 622552.0, 68457.0, 22757.0, 11284.0, 6499.0, 3900.0, 2588.0, 1620.0, 1113.0, 718.0, 507.0, 368.0, 247.0, 182.0, 103.0, 96.0, 48.0, 37.0, 29.0, 21.0, 12.0, 9.0, 6.0, 5.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.453125, -18.787109375, -18.12109375, -17.455078125, -16.7890625, -16.123046875, -15.45703125, -14.791015625, -14.125, -13.458984375, -12.79296875, -12.126953125, -11.4609375, -10.794921875, -10.12890625, -9.462890625, -8.796875, -8.130859375, -7.46484375, -6.798828125, -6.1328125, -5.466796875, -4.80078125, -4.134765625, -3.46875, -2.802734375, -2.13671875, -1.470703125, -0.8046875, -0.138671875, 0.52734375, 1.193359375, 1.859375, 2.525390625, 3.19140625, 3.857421875, 4.5234375, 5.189453125, 5.85546875, 6.521484375, 7.1875, 7.853515625, 8.51953125, 9.185546875, 9.8515625, 10.517578125, 11.18359375, 11.849609375, 12.515625, 13.181640625, 13.84765625, 14.513671875, 15.1796875, 15.845703125, 16.51171875, 17.177734375, 17.84375, 18.509765625, 19.17578125, 19.841796875, 20.5078125, 21.173828125, 21.83984375, 22.505859375, 23.171875]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 6.0, 5.0, 8.0, 4.0, 6.0, 8.0, 6.0, 11.0, 16.0, 17.0, 13.0, 22.0, 21.0, 29.0, 32.0, 37.0, 34.0, 39.0, 39.0, 54.0, 58.0, 104.0, 287.0, 1579.0, 138.0, 70.0, 43.0, 34.0, 42.0, 32.0, 29.0, 33.0, 25.0, 23.0, 17.0, 19.0, 23.0, 10.0, 17.0, 9.0, 5.0, 6.0, 7.0, 6.0, 3.0, 5.0, 8.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0], "bins": [-30.859375, -29.956298828125, -29.05322265625, -28.150146484375, -27.2470703125, -26.343994140625, -25.44091796875, -24.537841796875, -23.634765625, -22.731689453125, -21.82861328125, -20.925537109375, -20.0224609375, -19.119384765625, -18.21630859375, -17.313232421875, -16.41015625, -15.507080078125, -14.60400390625, -13.700927734375, -12.7978515625, -11.894775390625, -10.99169921875, -10.088623046875, -9.185546875, -8.282470703125, -7.37939453125, -6.476318359375, -5.5732421875, -4.670166015625, -3.76708984375, -2.864013671875, -1.9609375, -1.057861328125, -0.15478515625, 0.748291015625, 1.6513671875, 2.554443359375, 3.45751953125, 4.360595703125, 5.263671875, 6.166748046875, 7.06982421875, 7.972900390625, 8.8759765625, 9.779052734375, 10.68212890625, 11.585205078125, 12.48828125, 13.391357421875, 14.29443359375, 15.197509765625, 16.1005859375, 17.003662109375, 17.90673828125, 18.809814453125, 19.712890625, 20.615966796875, 21.51904296875, 22.422119140625, 23.3251953125, 24.228271484375, 25.13134765625, 26.034423828125, 26.9375]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [6.0, 1.0, 3.0, 6.0, 5.0, 4.0, 2.0, 10.0, 8.0, 9.0, 2.0, 17.0, 13.0, 18.0, 30.0, 24.0, 27.0, 37.0, 45.0, 54.0, 91.0, 123.0, 243.0, 454.0, 1152.0, 3349.0, 12321.0, 88925.0, 2947977.0, 73954.0, 11136.0, 3324.0, 1153.0, 433.0, 201.0, 134.0, 92.0, 68.0, 50.0, 38.0, 26.0, 30.0, 18.0, 16.0, 22.0, 15.0, 9.0, 6.0, 6.0, 8.0, 5.0, 6.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-49.90625, -48.1533203125, -46.400390625, -44.6474609375, -42.89453125, -41.1416015625, -39.388671875, -37.6357421875, -35.8828125, -34.1298828125, -32.376953125, -30.6240234375, -28.87109375, -27.1181640625, -25.365234375, -23.6123046875, -21.859375, -20.1064453125, -18.353515625, -16.6005859375, -14.84765625, -13.0947265625, -11.341796875, -9.5888671875, -7.8359375, -6.0830078125, -4.330078125, -2.5771484375, -0.82421875, 0.9287109375, 2.681640625, 4.4345703125, 6.1875, 7.9404296875, 9.693359375, 11.4462890625, 13.19921875, 14.9521484375, 16.705078125, 18.4580078125, 20.2109375, 21.9638671875, 23.716796875, 25.4697265625, 27.22265625, 28.9755859375, 30.728515625, 32.4814453125, 34.234375, 35.9873046875, 37.740234375, 39.4931640625, 41.24609375, 42.9990234375, 44.751953125, 46.5048828125, 48.2578125, 50.0107421875, 51.763671875, 53.5166015625, 55.26953125, 57.0224609375, 58.775390625, 60.5283203125, 62.28125]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 6.0, 33.0, 162.0, 486.0, 261.0, 59.0, 11.0], "bins": [-482.2396240234375, -474.2826232910156, -466.32562255859375, -458.36865234375, -450.4116516113281, -442.45465087890625, -434.4976501464844, -426.5406799316406, -418.58367919921875, -410.6266784667969, -402.669677734375, -394.71270751953125, -386.7557067871094, -378.7987060546875, -370.8417053222656, -362.8847351074219, -354.927734375, -346.9707336425781, -339.01373291015625, -331.0567626953125, -323.0997619628906, -315.14276123046875, -307.1857604980469, -299.2287902832031, -291.27178955078125, -283.3147888183594, -275.3577880859375, -267.40081787109375, -259.4438171386719, -251.48681640625, -243.5298309326172, -235.5728302001953, -227.61582946777344, -219.65882873535156, -211.70184326171875, -203.74484252929688, -195.78785705566406, -187.8308563232422, -179.87387084960938, -171.9168701171875, -163.9598846435547, -156.0028839111328, -148.0458984375, -140.08889770507812, -132.1319122314453, -124.17491149902344, -116.21792602539062, -108.26092529296875, -100.3039321899414, -92.34693908691406, -84.38994598388672, -76.43295288085938, -68.47595977783203, -60.51896286010742, -52.56196975708008, -44.604976654052734, -36.64798355102539, -28.690990447998047, -20.733997344970703, -12.777002334594727, -4.820009231567383, 3.1369857788085938, 11.093978881835938, 19.05097198486328, 27.007965087890625]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 1.0, 3.0, 1.0, 4.0, 2.0, 4.0, 5.0, 9.0, 9.0, 8.0, 11.0, 18.0, 27.0, 24.0, 14.0, 31.0, 37.0, 30.0, 35.0, 38.0, 43.0, 55.0, 46.0, 44.0, 46.0, 44.0, 45.0, 41.0, 37.0, 29.0, 28.0, 33.0, 43.0, 29.0, 21.0, 19.0, 17.0, 22.0, 4.0, 14.0, 7.0, 10.0, 6.0, 7.0, 6.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.95658111572266, -89.61892700195312, -86.28126525878906, -82.94361114501953, -79.60595703125, -76.26829528808594, -72.9306411743164, -69.59298706054688, -66.25532531738281, -62.917667388916016, -59.58000946044922, -56.24235534667969, -52.90469741821289, -49.567039489746094, -46.22938537597656, -42.891727447509766, -39.55406951904297, -36.21641159057617, -32.878753662109375, -29.541099548339844, -26.203441619873047, -22.86578369140625, -19.528127670288086, -16.190471649169922, -12.852813720703125, -9.515156745910645, -6.177499771118164, -2.8398427963256836, 0.4978141784667969, 3.8354721069335938, 7.173128128051758, 10.510784149169922, 13.84844970703125, 17.186107635498047, 20.52376365661621, 23.861419677734375, 27.199077606201172, 30.53673553466797, 33.8743896484375, 37.2120475769043, 40.549705505371094, 43.88736343383789, 47.22502136230469, 50.56267547607422, 53.900333404541016, 57.23799133300781, 60.575645446777344, 63.91330337524414, 67.25096130371094, 70.58861541748047, 73.92627716064453, 77.26393127441406, 80.60159301757812, 83.93924713134766, 87.27690124511719, 90.61456298828125, 93.95221710205078, 97.28987121582031, 100.62753295898438, 103.9651870727539, 107.30284118652344, 110.6405029296875, 113.97815704345703, 117.31581115722656, 120.65347290039062]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 5.0, 4.0, 5.0, 4.0, 4.0, 3.0, 7.0, 8.0, 12.0, 10.0, 14.0, 12.0, 15.0, 18.0, 25.0, 20.0, 28.0, 33.0, 38.0, 24.0, 34.0, 37.0, 41.0, 47.0, 37.0, 46.0, 31.0, 38.0, 32.0, 29.0, 40.0, 55.0, 26.0, 35.0, 34.0, 18.0, 20.0, 15.0, 13.0, 14.0, 17.0, 19.0, 9.0, 6.0, 6.0, 5.0, 3.0, 9.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-11.03125, -10.7103271484375, -10.389404296875, -10.0684814453125, -9.74755859375, -9.4266357421875, -9.105712890625, -8.7847900390625, -8.4638671875, -8.1429443359375, -7.822021484375, -7.5010986328125, -7.18017578125, -6.8592529296875, -6.538330078125, -6.2174072265625, -5.896484375, -5.5755615234375, -5.254638671875, -4.9337158203125, -4.61279296875, -4.2918701171875, -3.970947265625, -3.6500244140625, -3.3291015625, -3.0081787109375, -2.687255859375, -2.3663330078125, -2.04541015625, -1.7244873046875, -1.403564453125, -1.0826416015625, -0.76171875, -0.4407958984375, -0.119873046875, 0.2010498046875, 0.52197265625, 0.8428955078125, 1.163818359375, 1.4847412109375, 1.8056640625, 2.1265869140625, 2.447509765625, 2.7684326171875, 3.08935546875, 3.4102783203125, 3.731201171875, 4.0521240234375, 4.373046875, 4.6939697265625, 5.014892578125, 5.3358154296875, 5.65673828125, 5.9776611328125, 6.298583984375, 6.6195068359375, 6.9404296875, 7.2613525390625, 7.582275390625, 7.9031982421875, 8.22412109375, 8.5450439453125, 8.865966796875, 9.1868896484375, 9.5078125]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 4.0, 4.0, 4.0, 10.0, 15.0, 13.0, 9.0, 17.0, 19.0, 20.0, 34.0, 55.0, 82.0, 154.0, 246.0, 432.0, 856.0, 1734.0, 3905.0, 9767.0, 33470.0, 564452.0, 3260179.0, 280625.0, 24716.0, 7663.0, 3050.0, 1313.0, 612.0, 321.0, 161.0, 92.0, 56.0, 40.0, 34.0, 21.0, 13.0, 21.0, 12.0, 11.0, 9.0, 4.0, 6.0, 5.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-35.25, -34.22509765625, -33.2001953125, -32.17529296875, -31.150390625, -30.12548828125, -29.1005859375, -28.07568359375, -27.05078125, -26.02587890625, -25.0009765625, -23.97607421875, -22.951171875, -21.92626953125, -20.9013671875, -19.87646484375, -18.8515625, -17.82666015625, -16.8017578125, -15.77685546875, -14.751953125, -13.72705078125, -12.7021484375, -11.67724609375, -10.65234375, -9.62744140625, -8.6025390625, -7.57763671875, -6.552734375, -5.52783203125, -4.5029296875, -3.47802734375, -2.453125, -1.42822265625, -0.4033203125, 0.62158203125, 1.646484375, 2.67138671875, 3.6962890625, 4.72119140625, 5.74609375, 6.77099609375, 7.7958984375, 8.82080078125, 9.845703125, 10.87060546875, 11.8955078125, 12.92041015625, 13.9453125, 14.97021484375, 15.9951171875, 17.02001953125, 18.044921875, 19.06982421875, 20.0947265625, 21.11962890625, 22.14453125, 23.16943359375, 24.1943359375, 25.21923828125, 26.244140625, 27.26904296875, 28.2939453125, 29.31884765625, 30.34375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 2.0, 3.0, 1.0, 4.0, 4.0, 6.0, 3.0, 7.0, 6.0, 18.0, 8.0, 19.0, 24.0, 26.0, 37.0, 44.0, 69.0, 123.0, 141.0, 255.0, 444.0, 656.0, 797.0, 564.0, 310.0, 168.0, 106.0, 61.0, 36.0, 32.0, 25.0, 15.0, 18.0, 9.0, 11.0, 7.0, 6.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.296875, -23.5146484375, -22.732421875, -21.9501953125, -21.16796875, -20.3857421875, -19.603515625, -18.8212890625, -18.0390625, -17.2568359375, -16.474609375, -15.6923828125, -14.91015625, -14.1279296875, -13.345703125, -12.5634765625, -11.78125, -10.9990234375, -10.216796875, -9.4345703125, -8.65234375, -7.8701171875, -7.087890625, -6.3056640625, -5.5234375, -4.7412109375, -3.958984375, -3.1767578125, -2.39453125, -1.6123046875, -0.830078125, -0.0478515625, 0.734375, 1.5166015625, 2.298828125, 3.0810546875, 3.86328125, 4.6455078125, 5.427734375, 6.2099609375, 6.9921875, 7.7744140625, 8.556640625, 9.3388671875, 10.12109375, 10.9033203125, 11.685546875, 12.4677734375, 13.25, 14.0322265625, 14.814453125, 15.5966796875, 16.37890625, 17.1611328125, 17.943359375, 18.7255859375, 19.5078125, 20.2900390625, 21.072265625, 21.8544921875, 22.63671875, 23.4189453125, 24.201171875, 24.9833984375, 25.765625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 8.0, 13.0, 10.0, 16.0, 17.0, 28.0, 35.0, 70.0, 118.0, 289.0, 926.0, 3886.0, 34057.0, 3632592.0, 504462.0, 14393.0, 2196.0, 577.0, 221.0, 128.0, 54.0, 36.0, 34.0, 22.0, 16.0, 13.0, 16.0, 4.0, 8.0, 4.0, 7.0, 4.0, 2.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-92.5625, -89.7431640625, -86.923828125, -84.1044921875, -81.28515625, -78.4658203125, -75.646484375, -72.8271484375, -70.0078125, -67.1884765625, -64.369140625, -61.5498046875, -58.73046875, -55.9111328125, -53.091796875, -50.2724609375, -47.453125, -44.6337890625, -41.814453125, -38.9951171875, -36.17578125, -33.3564453125, -30.537109375, -27.7177734375, -24.8984375, -22.0791015625, -19.259765625, -16.4404296875, -13.62109375, -10.8017578125, -7.982421875, -5.1630859375, -2.34375, 0.4755859375, 3.294921875, 6.1142578125, 8.93359375, 11.7529296875, 14.572265625, 17.3916015625, 20.2109375, 23.0302734375, 25.849609375, 28.6689453125, 31.48828125, 34.3076171875, 37.126953125, 39.9462890625, 42.765625, 45.5849609375, 48.404296875, 51.2236328125, 54.04296875, 56.8623046875, 59.681640625, 62.5009765625, 65.3203125, 68.1396484375, 70.958984375, 73.7783203125, 76.59765625, 79.4169921875, 82.236328125, 85.0556640625, 87.875]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 7.0, 22.0, 62.0, 279.0, 402.0, 168.0, 58.0, 16.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-568.2228393554688, -556.716796875, -545.2108154296875, -533.7047729492188, -522.19873046875, -510.6927490234375, -499.18670654296875, -487.6806945800781, -476.1746826171875, -464.6686706542969, -453.1626281738281, -441.6566162109375, -430.1506042480469, -418.64459228515625, -407.1385498046875, -395.6325378417969, -384.1264953613281, -372.6204833984375, -361.11444091796875, -349.6084289550781, -338.1024169921875, -326.59637451171875, -315.0903625488281, -303.5843505859375, -292.07830810546875, -280.5722961425781, -269.0662536621094, -257.56024169921875, -246.05422973632812, -234.54820251464844, -223.04217529296875, -211.53616333007812, -200.03016662597656, -188.52413940429688, -177.01812744140625, -165.51210021972656, -154.00607299804688, -142.50006103515625, -130.99403381347656, -119.4880142211914, -107.98199462890625, -96.4759750366211, -84.96995544433594, -73.46392822265625, -61.957908630371094, -50.45188903808594, -38.94586181640625, -27.439842224121094, -15.933822631835938, -4.427801132202148, 7.078220367431641, 18.584243774414062, 30.09026336669922, 41.596282958984375, 53.10231018066406, 64.60832977294922, 76.11434936523438, 87.62036895751953, 99.12638854980469, 110.63241577148438, 122.13843536376953, 133.6444549560547, 145.15048217773438, 156.656494140625, 168.1625213623047]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 12.0, 9.0, 10.0, 8.0, 15.0, 13.0, 10.0, 24.0, 21.0, 13.0, 30.0, 16.0, 20.0, 28.0, 26.0, 29.0, 44.0, 39.0, 36.0, 46.0, 24.0, 37.0, 31.0, 33.0, 41.0, 29.0, 48.0, 37.0, 35.0, 31.0, 28.0, 22.0, 25.0, 18.0, 21.0, 16.0, 16.0, 6.0, 15.0, 3.0, 13.0, 6.0, 2.0, 6.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-74.22453308105469, -72.0906982421875, -69.95685577392578, -67.8230209350586, -65.6891860961914, -63.55534744262695, -61.4215087890625, -59.28767395019531, -57.15383529663086, -55.019996643066406, -52.88616180419922, -50.752323150634766, -48.61848449707031, -46.484649658203125, -44.35081100463867, -42.21697235107422, -40.08313751220703, -37.94929885864258, -35.81546401977539, -33.68162536621094, -31.547788619995117, -29.413951873779297, -27.280113220214844, -25.146276473999023, -23.012439727783203, -20.878602981567383, -18.744766235351562, -16.61092758178711, -14.477090835571289, -12.343254089355469, -10.209416389465332, -8.075578689575195, -5.941741943359375, -3.8079047203063965, -1.674067497253418, 0.45976972579956055, 2.593606948852539, 4.727443695068359, 6.861281394958496, 8.995119094848633, 11.128955841064453, 13.262792587280273, 15.39663028717041, 17.530467987060547, 19.664304733276367, 21.798141479492188, 23.93198013305664, 26.06581687927246, 28.19965362548828, 30.3334903717041, 32.46732711791992, 34.601165771484375, 36.73500061035156, 38.868839263916016, 41.00267791748047, 43.136512756347656, 45.27035140991211, 47.40419006347656, 49.53802490234375, 51.6718635559082, 53.805702209472656, 55.939537048339844, 58.0733757019043, 60.20721435546875, 62.34104919433594]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 1.0, 1.0, 2.0, 4.0, 7.0, 6.0, 5.0, 8.0, 10.0, 6.0, 7.0, 21.0, 14.0, 19.0, 24.0, 29.0, 22.0, 31.0, 31.0, 40.0, 38.0, 21.0, 39.0, 33.0, 44.0, 36.0, 37.0, 33.0, 35.0, 36.0, 46.0, 25.0, 33.0, 30.0, 36.0, 32.0, 20.0, 17.0, 16.0, 13.0, 19.0, 13.0, 17.0, 11.0, 13.0, 3.0, 5.0, 4.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.375, -10.0693359375, -9.763671875, -9.4580078125, -9.15234375, -8.8466796875, -8.541015625, -8.2353515625, -7.9296875, -7.6240234375, -7.318359375, -7.0126953125, -6.70703125, -6.4013671875, -6.095703125, -5.7900390625, -5.484375, -5.1787109375, -4.873046875, -4.5673828125, -4.26171875, -3.9560546875, -3.650390625, -3.3447265625, -3.0390625, -2.7333984375, -2.427734375, -2.1220703125, -1.81640625, -1.5107421875, -1.205078125, -0.8994140625, -0.59375, -0.2880859375, 0.017578125, 0.3232421875, 0.62890625, 0.9345703125, 1.240234375, 1.5458984375, 1.8515625, 2.1572265625, 2.462890625, 2.7685546875, 3.07421875, 3.3798828125, 3.685546875, 3.9912109375, 4.296875, 4.6025390625, 4.908203125, 5.2138671875, 5.51953125, 5.8251953125, 6.130859375, 6.4365234375, 6.7421875, 7.0478515625, 7.353515625, 7.6591796875, 7.96484375, 8.2705078125, 8.576171875, 8.8818359375, 9.1875]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 5.0, 12.0, 8.0, 26.0, 27.0, 45.0, 75.0, 111.0, 137.0, 224.0, 311.0, 401.0, 711.0, 971.0, 1532.0, 2163.0, 3288.0, 4933.0, 7351.0, 11536.0, 18125.0, 27815.0, 43626.0, 69351.0, 113528.0, 181669.0, 204458.0, 132235.0, 81488.0, 50587.0, 32094.0, 20744.0, 13403.0, 8697.0, 5718.0, 3680.0, 2470.0, 1582.0, 1136.0, 773.0, 475.0, 324.0, 225.0, 163.0, 116.0, 74.0, 45.0, 30.0, 22.0, 17.0, 8.0, 10.0, 2.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.230224609375, -0.22259140014648438, -0.21495819091796875, -0.20732498168945312, -0.1996917724609375, -0.19205856323242188, -0.18442535400390625, -0.17679214477539062, -0.169158935546875, -0.16152572631835938, -0.15389251708984375, -0.14625930786132812, -0.1386260986328125, -0.13099288940429688, -0.12335968017578125, -0.11572647094726562, -0.10809326171875, -0.10046005249023438, -0.09282684326171875, -0.08519363403320312, -0.0775604248046875, -0.06992721557617188, -0.06229400634765625, -0.054660797119140625, -0.047027587890625, -0.039394378662109375, -0.03176116943359375, -0.024127960205078125, -0.0164947509765625, -0.008861541748046875, -0.00122833251953125, 0.006404876708984375, 0.0140380859375, 0.021671295166015625, 0.02930450439453125, 0.036937713623046875, 0.0445709228515625, 0.052204132080078125, 0.05983734130859375, 0.06747055053710938, 0.075103759765625, 0.08273696899414062, 0.09037017822265625, 0.09800338745117188, 0.1056365966796875, 0.11326980590820312, 0.12090301513671875, 0.12853622436523438, 0.13616943359375, 0.14380264282226562, 0.15143585205078125, 0.15906906127929688, 0.1667022705078125, 0.17433547973632812, 0.18196868896484375, 0.18960189819335938, 0.197235107421875, 0.20486831665039062, 0.21250152587890625, 0.22013473510742188, 0.2277679443359375, 0.23540115356445312, 0.24303436279296875, 0.2506675720214844, 0.25830078125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 4.0, 6.0, 11.0, 4.0, 10.0, 11.0, 15.0, 10.0, 23.0, 24.0, 27.0, 18.0, 28.0, 44.0, 31.0, 45.0, 41.0, 44.0, 37.0, 38.0, 38.0, 1063.0, 49.0, 43.0, 34.0, 39.0, 37.0, 39.0, 32.0, 24.0, 24.0, 18.0, 20.0, 15.0, 19.0, 10.0, 12.0, 12.0, 9.0, 8.0, 7.0, 2.0, 2.0, 4.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.9609375, -7.6976318359375, -7.434326171875, -7.1710205078125, -6.90771484375, -6.6444091796875, -6.381103515625, -6.1177978515625, -5.8544921875, -5.5911865234375, -5.327880859375, -5.0645751953125, -4.80126953125, -4.5379638671875, -4.274658203125, -4.0113525390625, -3.748046875, -3.4847412109375, -3.221435546875, -2.9581298828125, -2.69482421875, -2.4315185546875, -2.168212890625, -1.9049072265625, -1.6416015625, -1.3782958984375, -1.114990234375, -0.8516845703125, -0.58837890625, -0.3250732421875, -0.061767578125, 0.2015380859375, 0.46484375, 0.7281494140625, 0.991455078125, 1.2547607421875, 1.51806640625, 1.7813720703125, 2.044677734375, 2.3079833984375, 2.5712890625, 2.8345947265625, 3.097900390625, 3.3612060546875, 3.62451171875, 3.8878173828125, 4.151123046875, 4.4144287109375, 4.677734375, 4.9410400390625, 5.204345703125, 5.4676513671875, 5.73095703125, 5.9942626953125, 6.257568359375, 6.5208740234375, 6.7841796875, 7.0474853515625, 7.310791015625, 7.5740966796875, 7.83740234375, 8.1007080078125, 8.364013671875, 8.6273193359375, 8.890625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 11.0, 19.0, 17.0, 24.0, 41.0, 91.0, 97.0, 142.0, 200.0, 311.0, 472.0, 639.0, 1054.0, 1389.0, 2194.0, 3200.0, 4898.0, 7488.0, 11487.0, 17695.0, 27607.0, 43115.0, 68410.0, 111839.0, 190023.0, 1256078.0, 129643.0, 79537.0, 49504.0, 31792.0, 20409.0, 12986.0, 8249.0, 5482.0, 3626.0, 2380.0, 1547.0, 1063.0, 693.0, 556.0, 360.0, 237.0, 173.0, 117.0, 67.0, 53.0, 47.0, 25.0, 15.0, 11.0, 9.0, 5.0, 4.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.12237548828125, -0.11856842041015625, -0.1147613525390625, -0.11095428466796875, -0.107147216796875, -0.10334014892578125, -0.0995330810546875, -0.09572601318359375, -0.0919189453125, -0.08811187744140625, -0.0843048095703125, -0.08049774169921875, -0.076690673828125, -0.07288360595703125, -0.0690765380859375, -0.06526947021484375, -0.06146240234375, -0.05765533447265625, -0.0538482666015625, -0.05004119873046875, -0.046234130859375, -0.04242706298828125, -0.0386199951171875, -0.03481292724609375, -0.031005859375, -0.02719879150390625, -0.0233917236328125, -0.01958465576171875, -0.015777587890625, -0.01197052001953125, -0.0081634521484375, -0.00435638427734375, -0.00054931640625, 0.00325775146484375, 0.0070648193359375, 0.01087188720703125, 0.014678955078125, 0.01848602294921875, 0.0222930908203125, 0.02610015869140625, 0.0299072265625, 0.03371429443359375, 0.0375213623046875, 0.04132843017578125, 0.045135498046875, 0.04894256591796875, 0.0527496337890625, 0.05655670166015625, 0.06036376953125, 0.06417083740234375, 0.0679779052734375, 0.07178497314453125, 0.075592041015625, 0.07939910888671875, 0.0832061767578125, 0.08701324462890625, 0.0908203125, 0.09462738037109375, 0.0984344482421875, 0.10224151611328125, 0.106048583984375, 0.10985565185546875, 0.1136627197265625, 0.11746978759765625, 0.12127685546875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 4.0, 7.0, 4.0, 10.0, 12.0, 15.0, 17.0, 23.0, 18.0, 20.0, 22.0, 25.0, 37.0, 41.0, 44.0, 47.0, 54.0, 63.0, 55.0, 56.0, 57.0, 55.0, 44.0, 36.0, 40.0, 28.0, 35.0, 20.0, 18.0, 17.0, 20.0, 13.0, 6.0, 7.0, 9.0, 8.0, 4.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011873245239257812, -0.0011524409055709839, -0.0011175572872161865, -0.0010826736688613892, -0.0010477900505065918, -0.0010129064321517944, -0.000978022813796997, -0.0009431391954421997, -0.0009082555770874023, -0.000873371958732605, -0.0008384883403778076, -0.0008036047220230103, -0.0007687211036682129, -0.0007338374853134155, -0.0006989538669586182, -0.0006640702486038208, -0.0006291866302490234, -0.0005943030118942261, -0.0005594193935394287, -0.0005245357751846313, -0.000489652156829834, -0.0004547685384750366, -0.00041988492012023926, -0.0003850013017654419, -0.00035011768341064453, -0.00031523406505584717, -0.0002803504467010498, -0.00024546682834625244, -0.00021058320999145508, -0.00017569959163665771, -0.00014081597328186035, -0.00010593235492706299, -7.104873657226562e-05, -3.616511821746826e-05, -1.2814998626708984e-06, 3.3602118492126465e-05, 6.848573684692383e-05, 0.00010336935520172119, 0.00013825297355651855, 0.00017313659191131592, 0.00020802021026611328, 0.00024290382862091064, 0.000277787446975708, 0.00031267106533050537, 0.00034755468368530273, 0.0003824383020401001, 0.00041732192039489746, 0.0004522055387496948, 0.0004870891571044922, 0.0005219727754592896, 0.0005568563938140869, 0.0005917400121688843, 0.0006266236305236816, 0.000661507248878479, 0.0006963908672332764, 0.0007312744855880737, 0.0007661581039428711, 0.0008010417222976685, 0.0008359253406524658, 0.0008708089590072632, 0.0009056925773620605, 0.0009405761957168579, 0.0009754598140716553, 0.0010103434324264526, 0.00104522705078125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 4.0, 7.0, 9.0, 6.0, 8.0, 11.0, 19.0, 17.0, 18.0, 21.0, 35.0, 32.0, 55.0, 91.0, 186.0, 503.0, 1515.0, 636541.0, 407003.0, 1444.0, 458.0, 190.0, 98.0, 50.0, 40.0, 26.0, 25.0, 22.0, 17.0, 22.0, 15.0, 19.0, 11.0, 9.0, 4.0, 7.0, 4.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0230712890625, -0.022301912307739258, -0.021532535552978516, -0.020763158798217773, -0.01999378204345703, -0.01922440528869629, -0.018455028533935547, -0.017685651779174805, -0.016916275024414062, -0.01614689826965332, -0.015377521514892578, -0.014608144760131836, -0.013838768005371094, -0.013069391250610352, -0.01230001449584961, -0.011530637741088867, -0.010761260986328125, -0.009991884231567383, -0.00922250747680664, -0.008453130722045898, -0.007683753967285156, -0.006914377212524414, -0.006145000457763672, -0.00537562370300293, -0.0046062469482421875, -0.0038368701934814453, -0.003067493438720703, -0.002298116683959961, -0.0015287399291992188, -0.0007593631744384766, 1.0013580322265625e-05, 0.0007793903350830078, 0.00154876708984375, 0.002318143844604492, 0.0030875205993652344, 0.0038568973541259766, 0.004626274108886719, 0.005395650863647461, 0.006165027618408203, 0.006934404373168945, 0.0077037811279296875, 0.00847315788269043, 0.009242534637451172, 0.010011911392211914, 0.010781288146972656, 0.011550664901733398, 0.01232004165649414, 0.013089418411254883, 0.013858795166015625, 0.014628171920776367, 0.01539754867553711, 0.01616692543029785, 0.016936302185058594, 0.017705678939819336, 0.018475055694580078, 0.01924443244934082, 0.020013809204101562, 0.020783185958862305, 0.021552562713623047, 0.02232193946838379, 0.02309131622314453, 0.023860692977905273, 0.024630069732666016, 0.025399446487426758, 0.0261688232421875]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 995.0, 15.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04389767348766327, -0.04310816153883934, -0.04231865331530571, -0.04152914136648178, -0.04073963314294815, -0.03995012119412422, -0.03916060924530029, -0.03837110102176666, -0.037581589072942734, -0.036792077124118805, -0.036002568900585175, -0.035213056951761246, -0.03442354500293732, -0.033634036779403687, -0.03284452483057976, -0.03205501660704613, -0.0312655046582222, -0.03047599457204342, -0.02968648448586464, -0.02889697253704071, -0.02810746245086193, -0.02731795236468315, -0.026528440415859222, -0.025738930329680443, -0.024949420243501663, -0.024159910157322884, -0.023370400071144104, -0.022580888122320175, -0.021791378036141396, -0.021001867949962616, -0.020212356001138687, -0.019422845914959908, -0.018633335828781128, -0.01784382574260235, -0.01705431565642357, -0.01626480370759964, -0.01547529362142086, -0.01468578353524208, -0.013896272517740726, -0.013106761500239372, -0.012317251414060593, -0.011527741327881813, -0.010738230310380459, -0.009948719292879105, -0.009159209206700325, -0.008369699120521545, -0.007580188103020191, -0.006790677551180124, -0.00600116653367877, -0.005211655981838703, -0.004422145429998636, -0.0036326348781585693, -0.0028431243263185024, -0.0020536137744784355, -0.0012641032226383686, -0.0004745926707983017, 0.0003149178810417652, 0.0011044284328818321, 0.001893938984721899, 0.002683449536561966, 0.003472960088402033, 0.0042624706402421, 0.005051981192082167, 0.005841491743922234, 0.0066310022957623005]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 13.0, 7.0, 10.0, 14.0, 16.0, 30.0, 32.0, 31.0, 37.0, 46.0, 50.0, 51.0, 54.0, 52.0, 57.0, 47.0, 57.0, 49.0, 54.0, 52.0, 44.0, 27.0, 41.0, 25.0, 25.0, 26.0, 12.0, 11.0, 13.0, 9.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011968016624450684, -0.001146787777543068, -0.0010967738926410675, -0.001046760007739067, -0.0009967461228370667, -0.0009467322379350662, -0.0008967183530330658, -0.0008467044681310654, -0.0007966905832290649, -0.0007466766983270645, -0.0006966628134250641, -0.0006466489285230637, -0.0005966350436210632, -0.0005466211587190628, -0.0004966072738170624, -0.00044659338891506195, -0.0003965795040130615, -0.0003465656191110611, -0.00029655173420906067, -0.00024653784930706024, -0.00019652396440505981, -0.0001465100795030594, -9.649619460105896e-05, -4.648230969905853e-05, 3.5315752029418945e-06, 5.354546010494232e-05, 0.00010355934500694275, 0.00015357322990894318, 0.0002035871148109436, 0.00025360099971294403, 0.00030361488461494446, 0.0003536287695169449, 0.0004036426544189453, 0.00045365653932094574, 0.0005036704242229462, 0.0005536843091249466, 0.000603698194026947, 0.0006537120789289474, 0.0007037259638309479, 0.0007537398487329483, 0.0008037537336349487, 0.0008537676185369492, 0.0009037815034389496, 0.00095379538834095, 0.0010038092732429504, 0.0010538231581449509, 0.0011038370430469513, 0.0011538509279489517, 0.0012038648128509521, 0.0012538786977529526, 0.001303892582654953, 0.0013539064675569534, 0.0014039203524589539, 0.0014539342373609543, 0.0015039481222629547, 0.0015539620071649551, 0.0016039758920669556, 0.001653989776968956, 0.0017040036618709564, 0.0017540175467729568, 0.0018040314316749573, 0.0018540453165769577, 0.0019040592014789581, 0.0019540730863809586, 0.002004086971282959]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 1.0, 1.0, 2.0, 4.0, 7.0, 6.0, 5.0, 8.0, 10.0, 6.0, 7.0, 21.0, 14.0, 19.0, 24.0, 29.0, 22.0, 31.0, 31.0, 40.0, 38.0, 21.0, 39.0, 33.0, 44.0, 36.0, 37.0, 33.0, 35.0, 36.0, 46.0, 25.0, 33.0, 30.0, 36.0, 32.0, 20.0, 17.0, 16.0, 13.0, 19.0, 13.0, 17.0, 11.0, 13.0, 3.0, 5.0, 4.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.375, -10.0693359375, -9.763671875, -9.4580078125, -9.15234375, -8.8466796875, -8.541015625, -8.2353515625, -7.9296875, -7.6240234375, -7.318359375, -7.0126953125, -6.70703125, -6.4013671875, -6.095703125, -5.7900390625, -5.484375, -5.1787109375, -4.873046875, -4.5673828125, -4.26171875, -3.9560546875, -3.650390625, -3.3447265625, -3.0390625, -2.7333984375, -2.427734375, -2.1220703125, -1.81640625, -1.5107421875, -1.205078125, -0.8994140625, -0.59375, -0.2880859375, 0.017578125, 0.3232421875, 0.62890625, 0.9345703125, 1.240234375, 1.5458984375, 1.8515625, 2.1572265625, 2.462890625, 2.7685546875, 3.07421875, 3.3798828125, 3.685546875, 3.9912109375, 4.296875, 4.6025390625, 4.908203125, 5.2138671875, 5.51953125, 5.8251953125, 6.130859375, 6.4365234375, 6.7421875, 7.0478515625, 7.353515625, 7.6591796875, 7.96484375, 8.2705078125, 8.576171875, 8.8818359375, 9.1875]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 9.0, 6.0, 10.0, 19.0, 23.0, 26.0, 37.0, 54.0, 88.0, 94.0, 125.0, 196.0, 275.0, 353.0, 537.0, 721.0, 1021.0, 1511.0, 2156.0, 3350.0, 4873.0, 7661.0, 12315.0, 20738.0, 45198.0, 485957.0, 365725.0, 41618.0, 19696.0, 11756.0, 7414.0, 4731.0, 3174.0, 2113.0, 1478.0, 1012.0, 693.0, 507.0, 364.0, 256.0, 182.0, 133.0, 104.0, 69.0, 55.0, 28.0, 29.0, 19.0, 19.0, 13.0, 9.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-17.6875, -17.134033203125, -16.58056640625, -16.027099609375, -15.4736328125, -14.920166015625, -14.36669921875, -13.813232421875, -13.259765625, -12.706298828125, -12.15283203125, -11.599365234375, -11.0458984375, -10.492431640625, -9.93896484375, -9.385498046875, -8.83203125, -8.278564453125, -7.72509765625, -7.171630859375, -6.6181640625, -6.064697265625, -5.51123046875, -4.957763671875, -4.404296875, -3.850830078125, -3.29736328125, -2.743896484375, -2.1904296875, -1.636962890625, -1.08349609375, -0.530029296875, 0.0234375, 0.576904296875, 1.13037109375, 1.683837890625, 2.2373046875, 2.790771484375, 3.34423828125, 3.897705078125, 4.451171875, 5.004638671875, 5.55810546875, 6.111572265625, 6.6650390625, 7.218505859375, 7.77197265625, 8.325439453125, 8.87890625, 9.432373046875, 9.98583984375, 10.539306640625, 11.0927734375, 11.646240234375, 12.19970703125, 12.753173828125, 13.306640625, 13.860107421875, 14.41357421875, 14.967041015625, 15.5205078125, 16.073974609375, 16.62744140625, 17.180908203125, 17.734375]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 6.0, 4.0, 9.0, 7.0, 12.0, 12.0, 14.0, 17.0, 16.0, 20.0, 33.0, 17.0, 34.0, 35.0, 38.0, 52.0, 43.0, 79.0, 131.0, 1648.0, 281.0, 98.0, 72.0, 57.0, 51.0, 36.0, 28.0, 35.0, 27.0, 19.0, 20.0, 20.0, 6.0, 7.0, 14.0, 10.0, 10.0, 4.0, 6.0, 6.0, 2.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.15625, -35.01806640625, -33.8798828125, -32.74169921875, -31.603515625, -30.46533203125, -29.3271484375, -28.18896484375, -27.05078125, -25.91259765625, -24.7744140625, -23.63623046875, -22.498046875, -21.35986328125, -20.2216796875, -19.08349609375, -17.9453125, -16.80712890625, -15.6689453125, -14.53076171875, -13.392578125, -12.25439453125, -11.1162109375, -9.97802734375, -8.83984375, -7.70166015625, -6.5634765625, -5.42529296875, -4.287109375, -3.14892578125, -2.0107421875, -0.87255859375, 0.265625, 1.40380859375, 2.5419921875, 3.68017578125, 4.818359375, 5.95654296875, 7.0947265625, 8.23291015625, 9.37109375, 10.50927734375, 11.6474609375, 12.78564453125, 13.923828125, 15.06201171875, 16.2001953125, 17.33837890625, 18.4765625, 19.61474609375, 20.7529296875, 21.89111328125, 23.029296875, 24.16748046875, 25.3056640625, 26.44384765625, 27.58203125, 28.72021484375, 29.8583984375, 30.99658203125, 32.134765625, 33.27294921875, 34.4111328125, 35.54931640625, 36.6875]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 6.0, 5.0, 14.0, 19.0, 18.0, 35.0, 32.0, 37.0, 44.0, 68.0, 102.0, 123.0, 228.0, 481.0, 1618.0, 7972.0, 73557.0, 3010436.0, 42776.0, 5825.0, 1201.0, 376.0, 188.0, 127.0, 82.0, 71.0, 46.0, 47.0, 32.0, 31.0, 21.0, 21.0, 13.0, 14.0, 3.0, 8.0, 4.0, 7.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-75.125, -72.654296875, -70.18359375, -67.712890625, -65.2421875, -62.771484375, -60.30078125, -57.830078125, -55.359375, -52.888671875, -50.41796875, -47.947265625, -45.4765625, -43.005859375, -40.53515625, -38.064453125, -35.59375, -33.123046875, -30.65234375, -28.181640625, -25.7109375, -23.240234375, -20.76953125, -18.298828125, -15.828125, -13.357421875, -10.88671875, -8.416015625, -5.9453125, -3.474609375, -1.00390625, 1.466796875, 3.9375, 6.408203125, 8.87890625, 11.349609375, 13.8203125, 16.291015625, 18.76171875, 21.232421875, 23.703125, 26.173828125, 28.64453125, 31.115234375, 33.5859375, 36.056640625, 38.52734375, 40.998046875, 43.46875, 45.939453125, 48.41015625, 50.880859375, 53.3515625, 55.822265625, 58.29296875, 60.763671875, 63.234375, 65.705078125, 68.17578125, 70.646484375, 73.1171875, 75.587890625, 78.05859375, 80.529296875, 83.0]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 14.0, 57.0, 115.0, 327.0, 268.0, 162.0, 52.0, 13.0, 9.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-288.46795654296875, -282.6966857910156, -276.9254455566406, -271.1541748046875, -265.3829345703125, -259.6116638183594, -253.84042358398438, -248.0691680908203, -242.29791259765625, -236.5266571044922, -230.75540161132812, -224.98414611816406, -219.212890625, -213.44163513183594, -207.67037963867188, -201.8991241455078, -196.12786865234375, -190.3566131591797, -184.58535766601562, -178.81410217285156, -173.0428466796875, -167.27159118652344, -161.50033569335938, -155.7290802001953, -149.9578094482422, -144.18655395507812, -138.41529846191406, -132.64404296875, -126.87278747558594, -121.10153198242188, -115.33027648925781, -109.55902099609375, -103.78777313232422, -98.01651763916016, -92.2452621459961, -86.47400665283203, -80.70275115966797, -74.9314956665039, -69.16023254394531, -63.388980865478516, -57.61772537231445, -51.84646987915039, -46.07521438598633, -40.303955078125, -34.53269958496094, -28.761445999145508, -22.990188598632812, -17.21893310546875, -11.447677612304688, -5.676421642303467, 0.0948343276977539, 5.866090774536133, 11.637346267700195, 17.408601760864258, 23.179859161376953, 28.951114654541016, 34.72237014770508, 40.49362564086914, 46.2648811340332, 52.03614044189453, 57.807395935058594, 63.578651428222656, 69.34990692138672, 75.12116241455078, 80.89241790771484]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 5.0, 5.0, 3.0, 10.0, 5.0, 11.0, 15.0, 17.0, 17.0, 18.0, 22.0, 15.0, 19.0, 25.0, 21.0, 28.0, 36.0, 29.0, 43.0, 29.0, 38.0, 39.0, 43.0, 41.0, 44.0, 36.0, 34.0, 39.0, 43.0, 39.0, 32.0, 29.0, 19.0, 21.0, 24.0, 13.0, 20.0, 17.0, 12.0, 13.0, 8.0, 6.0, 6.0, 3.0, 3.0, 5.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-83.98104095458984, -81.23321533203125, -78.48538970947266, -75.7375717163086, -72.98974609375, -70.2419204711914, -67.49409484863281, -64.74627685546875, -61.998451232910156, -59.25062561035156, -56.502803802490234, -53.75497817993164, -51.00715637207031, -48.25933074951172, -45.511505126953125, -42.7636833190918, -40.0158576965332, -37.26803207397461, -34.52021026611328, -31.772384643554688, -29.02456283569336, -26.276737213134766, -23.528913497924805, -20.781089782714844, -18.033266067504883, -15.285442352294922, -12.537618637084961, -9.789793968200684, -7.041970252990723, -4.294146537780762, -1.5463218688964844, 1.2015018463134766, 3.9493255615234375, 6.697149276733398, 9.44497299194336, 12.192797660827637, 14.940621376037598, 17.688446044921875, 20.436269760131836, 23.184093475341797, 25.931917190551758, 28.67974090576172, 31.42756462097168, 34.17538833618164, 36.923213958740234, 39.67103576660156, 42.418861389160156, 45.16668701171875, 47.91450881958008, 50.66233444213867, 53.41015625, 56.157981872558594, 58.90580368041992, 61.653629302978516, 64.40145111083984, 67.14927673339844, 69.89710235595703, 72.64492797851562, 75.39275360107422, 78.14057159423828, 80.88839721679688, 83.63622283935547, 86.38404846191406, 89.13186645507812, 91.87969207763672]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 8.0, 6.0, 8.0, 7.0, 3.0, 8.0, 15.0, 18.0, 20.0, 28.0, 29.0, 32.0, 30.0, 38.0, 30.0, 49.0, 36.0, 38.0, 38.0, 46.0, 49.0, 34.0, 35.0, 39.0, 29.0, 45.0, 35.0, 34.0, 27.0, 38.0, 19.0, 17.0, 20.0, 16.0, 18.0, 14.0, 10.0, 6.0, 6.0, 6.0, 3.0, 6.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.4453125, -12.0806884765625, -11.716064453125, -11.3514404296875, -10.98681640625, -10.6221923828125, -10.257568359375, -9.8929443359375, -9.5283203125, -9.1636962890625, -8.799072265625, -8.4344482421875, -8.06982421875, -7.7052001953125, -7.340576171875, -6.9759521484375, -6.611328125, -6.2467041015625, -5.882080078125, -5.5174560546875, -5.15283203125, -4.7882080078125, -4.423583984375, -4.0589599609375, -3.6943359375, -3.3297119140625, -2.965087890625, -2.6004638671875, -2.23583984375, -1.8712158203125, -1.506591796875, -1.1419677734375, -0.77734375, -0.4127197265625, -0.048095703125, 0.3165283203125, 0.68115234375, 1.0457763671875, 1.410400390625, 1.7750244140625, 2.1396484375, 2.5042724609375, 2.868896484375, 3.2335205078125, 3.59814453125, 3.9627685546875, 4.327392578125, 4.6920166015625, 5.056640625, 5.4212646484375, 5.785888671875, 6.1505126953125, 6.51513671875, 6.8797607421875, 7.244384765625, 7.6090087890625, 7.9736328125, 8.3382568359375, 8.702880859375, 9.0675048828125, 9.43212890625, 9.7967529296875, 10.161376953125, 10.5260009765625, 10.890625]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 4.0, 9.0, 5.0, 6.0, 10.0, 17.0, 27.0, 18.0, 34.0, 32.0, 45.0, 59.0, 83.0, 85.0, 144.0, 222.0, 382.0, 672.0, 1366.0, 3198.0, 8733.0, 31378.0, 570900.0, 3307796.0, 235309.0, 22153.0, 6558.0, 2448.0, 1068.0, 529.0, 273.0, 177.0, 118.0, 106.0, 67.0, 54.0, 53.0, 43.0, 20.0, 17.0, 15.0, 12.0, 17.0, 6.0, 2.0, 7.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-37.53125, -36.40673828125, -35.2822265625, -34.15771484375, -33.033203125, -31.90869140625, -30.7841796875, -29.65966796875, -28.53515625, -27.41064453125, -26.2861328125, -25.16162109375, -24.037109375, -22.91259765625, -21.7880859375, -20.66357421875, -19.5390625, -18.41455078125, -17.2900390625, -16.16552734375, -15.041015625, -13.91650390625, -12.7919921875, -11.66748046875, -10.54296875, -9.41845703125, -8.2939453125, -7.16943359375, -6.044921875, -4.92041015625, -3.7958984375, -2.67138671875, -1.546875, -0.42236328125, 0.7021484375, 1.82666015625, 2.951171875, 4.07568359375, 5.2001953125, 6.32470703125, 7.44921875, 8.57373046875, 9.6982421875, 10.82275390625, 11.947265625, 13.07177734375, 14.1962890625, 15.32080078125, 16.4453125, 17.56982421875, 18.6943359375, 19.81884765625, 20.943359375, 22.06787109375, 23.1923828125, 24.31689453125, 25.44140625, 26.56591796875, 27.6904296875, 28.81494140625, 29.939453125, 31.06396484375, 32.1884765625, 33.31298828125, 34.4375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 6.0, 12.0, 12.0, 18.0, 20.0, 24.0, 32.0, 44.0, 55.0, 80.0, 129.0, 254.0, 441.0, 778.0, 852.0, 567.0, 304.0, 137.0, 89.0, 56.0, 44.0, 30.0, 26.0, 17.0, 12.0, 7.0, 4.0, 5.0, 3.0, 4.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.734375, -27.8125, -26.890625, -25.96875, -25.046875, -24.125, -23.203125, -22.28125, -21.359375, -20.4375, -19.515625, -18.59375, -17.671875, -16.75, -15.828125, -14.90625, -13.984375, -13.0625, -12.140625, -11.21875, -10.296875, -9.375, -8.453125, -7.53125, -6.609375, -5.6875, -4.765625, -3.84375, -2.921875, -2.0, -1.078125, -0.15625, 0.765625, 1.6875, 2.609375, 3.53125, 4.453125, 5.375, 6.296875, 7.21875, 8.140625, 9.0625, 9.984375, 10.90625, 11.828125, 12.75, 13.671875, 14.59375, 15.515625, 16.4375, 17.359375, 18.28125, 19.203125, 20.125, 21.046875, 21.96875, 22.890625, 23.8125, 24.734375, 25.65625, 26.578125, 27.5, 28.421875, 29.34375, 30.265625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 6.0, 4.0, 6.0, 4.0, 11.0, 24.0, 29.0, 46.0, 68.0, 123.0, 218.0, 700.0, 3311.0, 41140.0, 3933711.0, 205214.0, 7665.0, 1170.0, 338.0, 181.0, 105.0, 47.0, 46.0, 29.0, 18.0, 15.0, 17.0, 8.0, 10.0, 5.0, 2.0, 2.0, 2.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-105.0, -101.7890625, -98.578125, -95.3671875, -92.15625, -88.9453125, -85.734375, -82.5234375, -79.3125, -76.1015625, -72.890625, -69.6796875, -66.46875, -63.2578125, -60.046875, -56.8359375, -53.625, -50.4140625, -47.203125, -43.9921875, -40.78125, -37.5703125, -34.359375, -31.1484375, -27.9375, -24.7265625, -21.515625, -18.3046875, -15.09375, -11.8828125, -8.671875, -5.4609375, -2.25, 0.9609375, 4.171875, 7.3828125, 10.59375, 13.8046875, 17.015625, 20.2265625, 23.4375, 26.6484375, 29.859375, 33.0703125, 36.28125, 39.4921875, 42.703125, 45.9140625, 49.125, 52.3359375, 55.546875, 58.7578125, 61.96875, 65.1796875, 68.390625, 71.6015625, 74.8125, 78.0234375, 81.234375, 84.4453125, 87.65625, 90.8671875, 94.078125, 97.2890625, 100.5]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 4.0, 4.0, 21.0, 37.0, 85.0, 142.0, 232.0, 217.0, 135.0, 70.0, 33.0, 18.0, 9.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-113.5796890258789, -107.28607940673828, -100.99246215820312, -94.6988525390625, -88.40523529052734, -82.11162567138672, -75.81800842285156, -69.52439880371094, -63.23078536987305, -56.937171936035156, -50.643558502197266, -44.349945068359375, -38.05633544921875, -31.762720108032227, -25.46910858154297, -19.175495147705078, -12.881881713867188, -6.588268756866455, -0.29465579986572266, 5.998956680297852, 12.292570114135742, 18.586183547973633, 24.87979507446289, 31.17340850830078, 37.46702194213867, 43.76063537597656, 50.05424880981445, 56.347862243652344, 62.64147186279297, 68.93508911132812, 75.22869873046875, 81.52230834960938, 87.81593322753906, 94.10954284667969, 100.40316009521484, 106.69676971435547, 112.99038696289062, 119.28399658203125, 125.57760620117188, 131.8712158203125, 138.1648406982422, 144.4584503173828, 150.75205993652344, 157.04568481445312, 163.33929443359375, 169.63290405273438, 175.926513671875, 182.22012329101562, 188.51373291015625, 194.80734252929688, 201.1009521484375, 207.3945770263672, 213.6881866455078, 219.98179626464844, 226.27540588378906, 232.56903076171875, 238.86264038085938, 245.15625, 251.44985961914062, 257.74346923828125, 264.0370788574219, 270.3307189941406, 276.62432861328125, 282.9179382324219, 289.2115478515625]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 8.0, 9.0, 12.0, 14.0, 11.0, 14.0, 23.0, 17.0, 19.0, 16.0, 30.0, 24.0, 38.0, 33.0, 32.0, 41.0, 36.0, 40.0, 36.0, 39.0, 39.0, 49.0, 27.0, 36.0, 45.0, 29.0, 34.0, 29.0, 24.0, 22.0, 29.0, 24.0, 27.0, 13.0, 14.0, 8.0, 12.0, 8.0, 8.0, 8.0, 7.0, 8.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-65.63673400878906, -63.30698776245117, -60.97724533081055, -58.647499084472656, -56.31775665283203, -53.98801040649414, -51.65826416015625, -49.328521728515625, -46.998775482177734, -44.669029235839844, -42.33928680419922, -40.00954055786133, -37.67979431152344, -35.35005187988281, -33.02030563354492, -30.690561294555664, -28.360816955566406, -26.03107261657715, -23.70132827758789, -21.37158203125, -19.041837692260742, -16.712093353271484, -14.38234806060791, -12.052602767944336, -9.722858428955078, -7.393113613128662, -5.063368797302246, -2.73362398147583, -0.40387916564941406, 1.9258651733398438, 4.255610466003418, 6.585355758666992, 8.91510009765625, 11.244844436645508, 13.574589729309082, 15.904335021972656, 18.234079360961914, 20.563823699951172, 22.893569946289062, 25.22331428527832, 27.553058624267578, 29.882802963256836, 32.212547302246094, 34.542293548583984, 36.872039794921875, 39.2017822265625, 41.53152847290039, 43.86127471923828, 46.191017150878906, 48.5207633972168, 50.85050582885742, 53.18025207519531, 55.50999450683594, 57.83974075317383, 60.16948699951172, 62.499229431152344, 64.8289794921875, 67.15872192382812, 69.48847198486328, 71.8182144165039, 74.14795684814453, 76.47770690917969, 78.80744934082031, 81.13719177246094, 83.46693420410156]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 0.0, 1.0, 3.0, 2.0, 7.0, 7.0, 5.0, 11.0, 12.0, 10.0, 15.0, 15.0, 21.0, 23.0, 28.0, 25.0, 36.0, 36.0, 36.0, 34.0, 35.0, 32.0, 50.0, 50.0, 36.0, 46.0, 33.0, 40.0, 24.0, 31.0, 44.0, 29.0, 27.0, 34.0, 17.0, 24.0, 24.0, 13.0, 14.0, 10.0, 11.0, 11.0, 10.0, 4.0, 6.0, 7.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0], "bins": [-11.90625, -11.570068359375, -11.23388671875, -10.897705078125, -10.5615234375, -10.225341796875, -9.88916015625, -9.552978515625, -9.216796875, -8.880615234375, -8.54443359375, -8.208251953125, -7.8720703125, -7.535888671875, -7.19970703125, -6.863525390625, -6.52734375, -6.191162109375, -5.85498046875, -5.518798828125, -5.1826171875, -4.846435546875, -4.51025390625, -4.174072265625, -3.837890625, -3.501708984375, -3.16552734375, -2.829345703125, -2.4931640625, -2.156982421875, -1.82080078125, -1.484619140625, -1.1484375, -0.812255859375, -0.47607421875, -0.139892578125, 0.1962890625, 0.532470703125, 0.86865234375, 1.204833984375, 1.541015625, 1.877197265625, 2.21337890625, 2.549560546875, 2.8857421875, 3.221923828125, 3.55810546875, 3.894287109375, 4.23046875, 4.566650390625, 4.90283203125, 5.239013671875, 5.5751953125, 5.911376953125, 6.24755859375, 6.583740234375, 6.919921875, 7.256103515625, 7.59228515625, 7.928466796875, 8.2646484375, 8.600830078125, 8.93701171875, 9.273193359375, 9.609375]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 8.0, 6.0, 15.0, 13.0, 16.0, 36.0, 43.0, 84.0, 125.0, 181.0, 316.0, 498.0, 824.0, 1199.0, 2013.0, 3313.0, 5221.0, 8644.0, 14412.0, 24489.0, 42307.0, 73871.0, 133143.0, 238699.0, 217301.0, 119529.0, 67412.0, 38504.0, 22531.0, 13167.0, 8006.0, 4710.0, 2983.0, 1874.0, 1120.0, 724.0, 440.0, 295.0, 174.0, 114.0, 73.0, 44.0, 31.0, 28.0, 7.0, 12.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.32666015625, -0.3170280456542969, -0.30739593505859375, -0.2977638244628906, -0.2881317138671875, -0.2784996032714844, -0.26886749267578125, -0.2592353820800781, -0.249603271484375, -0.23997116088867188, -0.23033905029296875, -0.22070693969726562, -0.2110748291015625, -0.20144271850585938, -0.19181060791015625, -0.18217849731445312, -0.17254638671875, -0.16291427612304688, -0.15328216552734375, -0.14365005493164062, -0.1340179443359375, -0.12438583374023438, -0.11475372314453125, -0.10512161254882812, -0.095489501953125, -0.08585739135742188, -0.07622528076171875, -0.06659317016601562, -0.0569610595703125, -0.047328948974609375, -0.03769683837890625, -0.028064727783203125, -0.0184326171875, -0.008800506591796875, 0.00083160400390625, 0.010463714599609375, 0.0200958251953125, 0.029727935791015625, 0.03936004638671875, 0.048992156982421875, 0.058624267578125, 0.06825637817382812, 0.07788848876953125, 0.08752059936523438, 0.0971527099609375, 0.10678482055664062, 0.11641693115234375, 0.12604904174804688, 0.13568115234375, 0.14531326293945312, 0.15494537353515625, 0.16457748413085938, 0.1742095947265625, 0.18384170532226562, 0.19347381591796875, 0.20310592651367188, 0.212738037109375, 0.22237014770507812, 0.23200225830078125, 0.24163436889648438, 0.2512664794921875, 0.2608985900878906, 0.27053070068359375, 0.2801628112792969, 0.289794921875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 6.0, 5.0, 6.0, 10.0, 13.0, 11.0, 14.0, 17.0, 27.0, 21.0, 30.0, 25.0, 37.0, 38.0, 37.0, 32.0, 31.0, 39.0, 32.0, 51.0, 1067.0, 39.0, 47.0, 36.0, 42.0, 36.0, 39.0, 28.0, 31.0, 31.0, 24.0, 16.0, 26.0, 12.0, 12.0, 15.0, 9.0, 9.0, 5.0, 4.0, 6.0, 9.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.75, -9.458984375, -9.16796875, -8.876953125, -8.5859375, -8.294921875, -8.00390625, -7.712890625, -7.421875, -7.130859375, -6.83984375, -6.548828125, -6.2578125, -5.966796875, -5.67578125, -5.384765625, -5.09375, -4.802734375, -4.51171875, -4.220703125, -3.9296875, -3.638671875, -3.34765625, -3.056640625, -2.765625, -2.474609375, -2.18359375, -1.892578125, -1.6015625, -1.310546875, -1.01953125, -0.728515625, -0.4375, -0.146484375, 0.14453125, 0.435546875, 0.7265625, 1.017578125, 1.30859375, 1.599609375, 1.890625, 2.181640625, 2.47265625, 2.763671875, 3.0546875, 3.345703125, 3.63671875, 3.927734375, 4.21875, 4.509765625, 4.80078125, 5.091796875, 5.3828125, 5.673828125, 5.96484375, 6.255859375, 6.546875, 6.837890625, 7.12890625, 7.419921875, 7.7109375, 8.001953125, 8.29296875, 8.583984375, 8.875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [5.0, 5.0, 2.0, 4.0, 3.0, 7.0, 14.0, 14.0, 12.0, 16.0, 39.0, 59.0, 61.0, 113.0, 156.0, 228.0, 322.0, 471.0, 650.0, 899.0, 1292.0, 1877.0, 2677.0, 3955.0, 5607.0, 8550.0, 13106.0, 19830.0, 30262.0, 46790.0, 72628.0, 116999.0, 311714.0, 1123449.0, 119730.0, 75081.0, 47820.0, 31141.0, 20526.0, 13401.0, 8696.0, 5947.0, 3919.0, 2728.0, 1902.0, 1266.0, 909.0, 671.0, 440.0, 350.0, 252.0, 169.0, 112.0, 85.0, 63.0, 49.0, 29.0, 20.0, 13.0, 4.0, 5.0, 3.0, 0.0, 5.0], "bins": [-0.1302490234375, -0.12630558013916016, -0.12236213684082031, -0.11841869354248047, -0.11447525024414062, -0.11053180694580078, -0.10658836364746094, -0.1026449203491211, -0.09870147705078125, -0.0947580337524414, -0.09081459045410156, -0.08687114715576172, -0.08292770385742188, -0.07898426055908203, -0.07504081726074219, -0.07109737396240234, -0.0671539306640625, -0.06321048736572266, -0.05926704406738281, -0.05532360076904297, -0.051380157470703125, -0.04743671417236328, -0.04349327087402344, -0.039549827575683594, -0.03560638427734375, -0.031662940979003906, -0.027719497680664062, -0.02377605438232422, -0.019832611083984375, -0.01588916778564453, -0.011945724487304688, -0.008002281188964844, -0.004058837890625, -0.00011539459228515625, 0.0038280487060546875, 0.007771492004394531, 0.011714935302734375, 0.01565837860107422, 0.019601821899414062, 0.023545265197753906, 0.02748870849609375, 0.031432151794433594, 0.03537559509277344, 0.03931903839111328, 0.043262481689453125, 0.04720592498779297, 0.05114936828613281, 0.055092811584472656, 0.0590362548828125, 0.06297969818115234, 0.06692314147949219, 0.07086658477783203, 0.07481002807617188, 0.07875347137451172, 0.08269691467285156, 0.0866403579711914, 0.09058380126953125, 0.0945272445678711, 0.09847068786621094, 0.10241413116455078, 0.10635757446289062, 0.11030101776123047, 0.11424446105957031, 0.11818790435791016, 0.12213134765625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 8.0, 7.0, 3.0, 1.0, 6.0, 9.0, 13.0, 12.0, 9.0, 16.0, 17.0, 17.0, 20.0, 15.0, 37.0, 30.0, 34.0, 36.0, 49.0, 41.0, 43.0, 62.0, 59.0, 51.0, 44.0, 52.0, 42.0, 43.0, 28.0, 33.0, 30.0, 27.0, 13.0, 16.0, 13.0, 16.0, 8.0, 13.0, 6.0, 7.0, 7.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.0009794235229492188, -0.0009486228227615356, -0.0009178221225738525, -0.0008870214223861694, -0.0008562207221984863, -0.0008254200220108032, -0.0007946193218231201, -0.000763818621635437, -0.0007330179214477539, -0.0007022172212600708, -0.0006714165210723877, -0.0006406158208847046, -0.0006098151206970215, -0.0005790144205093384, -0.0005482137203216553, -0.0005174130201339722, -0.00048661231994628906, -0.00045581161975860596, -0.00042501091957092285, -0.00039421021938323975, -0.00036340951919555664, -0.00033260881900787354, -0.00030180811882019043, -0.0002710074186325073, -0.00024020671844482422, -0.0002094060182571411, -0.000178605318069458, -0.0001478046178817749, -0.0001170039176940918, -8.620321750640869e-05, -5.5402517318725586e-05, -2.460181713104248e-05, 6.198883056640625e-06, 3.699958324432373e-05, 6.780028343200684e-05, 9.860098361968994e-05, 0.00012940168380737305, 0.00016020238399505615, 0.00019100308418273926, 0.00022180378437042236, 0.00025260448455810547, 0.0002834051847457886, 0.0003142058849334717, 0.0003450065851211548, 0.0003758072853088379, 0.000406607985496521, 0.0004374086856842041, 0.0004682093858718872, 0.0004990100860595703, 0.0005298107862472534, 0.0005606114864349365, 0.0005914121866226196, 0.0006222128868103027, 0.0006530135869979858, 0.0006838142871856689, 0.000714614987373352, 0.0007454156875610352, 0.0007762163877487183, 0.0008070170879364014, 0.0008378177881240845, 0.0008686184883117676, 0.0008994191884994507, 0.0009302198886871338, 0.0009610205888748169, 0.0009918212890625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 10.0, 7.0, 7.0, 11.0, 8.0, 17.0, 12.0, 15.0, 16.0, 28.0, 35.0, 35.0, 44.0, 89.0, 180.0, 401.0, 1119.0, 55831.0, 986733.0, 2675.0, 581.0, 232.0, 115.0, 68.0, 53.0, 33.0, 35.0, 18.0, 19.0, 18.0, 20.0, 14.0, 9.0, 11.0, 14.0, 8.0, 6.0, 2.0, 3.0, 6.0, 9.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0220184326171875, -0.02133488655090332, -0.02065134048461914, -0.01996779441833496, -0.01928424835205078, -0.0186007022857666, -0.017917156219482422, -0.017233610153198242, -0.016550064086914062, -0.015866518020629883, -0.015182971954345703, -0.014499425888061523, -0.013815879821777344, -0.013132333755493164, -0.012448787689208984, -0.011765241622924805, -0.011081695556640625, -0.010398149490356445, -0.009714603424072266, -0.009031057357788086, -0.008347511291503906, -0.0076639652252197266, -0.006980419158935547, -0.006296873092651367, -0.0056133270263671875, -0.004929780960083008, -0.004246234893798828, -0.0035626888275146484, -0.0028791427612304688, -0.002195596694946289, -0.0015120506286621094, -0.0008285045623779297, -0.00014495849609375, 0.0005385875701904297, 0.0012221336364746094, 0.001905679702758789, 0.0025892257690429688, 0.0032727718353271484, 0.003956317901611328, 0.004639863967895508, 0.0053234100341796875, 0.006006956100463867, 0.006690502166748047, 0.0073740482330322266, 0.008057594299316406, 0.008741140365600586, 0.009424686431884766, 0.010108232498168945, 0.010791778564453125, 0.011475324630737305, 0.012158870697021484, 0.012842416763305664, 0.013525962829589844, 0.014209508895874023, 0.014893054962158203, 0.015576601028442383, 0.016260147094726562, 0.016943693161010742, 0.017627239227294922, 0.0183107852935791, 0.01899433135986328, 0.01967787742614746, 0.02036142349243164, 0.02104496955871582, 0.021728515625]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 397.0, 613.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.022900115698575974, -0.022442439571022987, -0.02198476344347, -0.021527087315917015, -0.02106941118836403, -0.020611733198165894, -0.020154058933258057, -0.01969638094305992, -0.019238704815506935, -0.01878102868795395, -0.018323352560400963, -0.017865676432847977, -0.01740800030529499, -0.016950324177742004, -0.01649264618754387, -0.016034970059990883, -0.015577294863760471, -0.015119618736207485, -0.014661942608654499, -0.014204265549778938, -0.013746589422225952, -0.013288913294672966, -0.01283123716711998, -0.012373561039566994, -0.011915884912014008, -0.011458208784461021, -0.011000532656908035, -0.01054285652935505, -0.010085179470479488, -0.009627503342926502, -0.009169827215373516, -0.00871215108782053, -0.008254473097622395, -0.007796796970069408, -0.007339120376855135, -0.006881444249302149, -0.006423767656087875, -0.005966091528534889, -0.005508415400981903, -0.005050739273428917, -0.0045930626802146435, -0.004135386552661657, -0.003677709959447384, -0.0032200338318943977, -0.002762357471510768, -0.002304681111127138, -0.001847004983574152, -0.0013893286231905222, -0.0009316522628068924, -0.0004739759606309235, -1.6299658454954624e-05, 0.00044137658551335335, 0.0008990529458969831, 0.001356729306280613, 0.001814405433833599, 0.002272081794217229, 0.0027297581546008587, 0.0031874345149844885, 0.0036451108753681183, 0.004102787002921104, 0.004560463130474091, 0.005018139723688364, 0.00547581585124135, 0.005933492444455624, 0.00639116857200861]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 8.0, 4.0, 6.0, 9.0, 12.0, 16.0, 13.0, 24.0, 25.0, 34.0, 29.0, 31.0, 35.0, 40.0, 49.0, 55.0, 52.0, 48.0, 44.0, 56.0, 47.0, 43.0, 33.0, 49.0, 43.0, 35.0, 31.0, 28.0, 19.0, 14.0, 15.0, 14.0, 12.0, 8.0, 9.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010987520217895508, -0.0010580597445368767, -0.0010173674672842026, -0.0009766751900315285, -0.0009359829127788544, -0.0008952906355261803, -0.0008545983582735062, -0.0008139060810208321, -0.000773213803768158, -0.0007325215265154839, -0.0006918292492628098, -0.0006511369720101357, -0.0006104446947574615, -0.0005697524175047874, -0.0005290601402521133, -0.0004883678629994392, -0.00044767558574676514, -0.00040698330849409103, -0.00036629103124141693, -0.00032559875398874283, -0.0002849064767360687, -0.0002442141994833946, -0.00020352192223072052, -0.00016282964497804642, -0.00012213736772537231, -8.144509047269821e-05, -4.075281322002411e-05, -6.05359673500061e-08, 4.06317412853241e-05, 8.13240185379982e-05, 0.0001220162957906723, 0.0001627085730433464, 0.0002034008502960205, 0.0002440931275486946, 0.0002847854048013687, 0.0003254776820540428, 0.0003661699593067169, 0.000406862236559391, 0.0004475545138120651, 0.00048824679106473923, 0.0005289390683174133, 0.0005696313455700874, 0.0006103236228227615, 0.0006510159000754356, 0.0006917081773281097, 0.0007324004545807838, 0.000773092731833458, 0.000813785009086132, 0.0008544772863388062, 0.0008951695635914803, 0.0009358618408441544, 0.0009765541180968285, 0.0010172463953495026, 0.0010579386726021767, 0.0010986309498548508, 0.0011393232271075249, 0.001180015504360199, 0.001220707781612873, 0.0012614000588655472, 0.0013020923361182213, 0.0013427846133708954, 0.0013834768906235695, 0.0014241691678762436, 0.0014648614451289177, 0.0015055537223815918]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 0.0, 1.0, 3.0, 2.0, 7.0, 7.0, 5.0, 11.0, 12.0, 10.0, 15.0, 15.0, 21.0, 23.0, 28.0, 25.0, 36.0, 36.0, 36.0, 34.0, 35.0, 32.0, 50.0, 50.0, 36.0, 46.0, 33.0, 40.0, 24.0, 31.0, 44.0, 29.0, 27.0, 34.0, 17.0, 24.0, 24.0, 13.0, 14.0, 10.0, 11.0, 11.0, 10.0, 4.0, 6.0, 7.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0], "bins": [-11.90625, -11.570068359375, -11.23388671875, -10.897705078125, -10.5615234375, -10.225341796875, -9.88916015625, -9.552978515625, -9.216796875, -8.880615234375, -8.54443359375, -8.208251953125, -7.8720703125, -7.535888671875, -7.19970703125, -6.863525390625, -6.52734375, -6.191162109375, -5.85498046875, -5.518798828125, -5.1826171875, -4.846435546875, -4.51025390625, -4.174072265625, -3.837890625, -3.501708984375, -3.16552734375, -2.829345703125, -2.4931640625, -2.156982421875, -1.82080078125, -1.484619140625, -1.1484375, -0.812255859375, -0.47607421875, -0.139892578125, 0.1962890625, 0.532470703125, 0.86865234375, 1.204833984375, 1.541015625, 1.877197265625, 2.21337890625, 2.549560546875, 2.8857421875, 3.221923828125, 3.55810546875, 3.894287109375, 4.23046875, 4.566650390625, 4.90283203125, 5.239013671875, 5.5751953125, 5.911376953125, 6.24755859375, 6.583740234375, 6.919921875, 7.256103515625, 7.59228515625, 7.928466796875, 8.2646484375, 8.600830078125, 8.93701171875, 9.273193359375, 9.609375]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 5.0, 7.0, 11.0, 11.0, 17.0, 22.0, 31.0, 37.0, 67.0, 80.0, 126.0, 149.0, 221.0, 327.0, 492.0, 777.0, 1082.0, 1694.0, 2586.0, 4183.0, 7570.0, 15172.0, 48859.0, 613288.0, 289859.0, 32559.0, 12322.0, 6343.0, 3751.0, 2301.0, 1478.0, 991.0, 644.0, 457.0, 302.0, 218.0, 176.0, 94.0, 64.0, 64.0, 32.0, 26.0, 10.0, 21.0, 8.0, 12.0, 3.0, 3.0, 0.0, 4.0, 3.0, 3.0, 0.0, 1.0], "bins": [-17.015625, -16.51318359375, -16.0107421875, -15.50830078125, -15.005859375, -14.50341796875, -14.0009765625, -13.49853515625, -12.99609375, -12.49365234375, -11.9912109375, -11.48876953125, -10.986328125, -10.48388671875, -9.9814453125, -9.47900390625, -8.9765625, -8.47412109375, -7.9716796875, -7.46923828125, -6.966796875, -6.46435546875, -5.9619140625, -5.45947265625, -4.95703125, -4.45458984375, -3.9521484375, -3.44970703125, -2.947265625, -2.44482421875, -1.9423828125, -1.43994140625, -0.9375, -0.43505859375, 0.0673828125, 0.56982421875, 1.072265625, 1.57470703125, 2.0771484375, 2.57958984375, 3.08203125, 3.58447265625, 4.0869140625, 4.58935546875, 5.091796875, 5.59423828125, 6.0966796875, 6.59912109375, 7.1015625, 7.60400390625, 8.1064453125, 8.60888671875, 9.111328125, 9.61376953125, 10.1162109375, 10.61865234375, 11.12109375, 11.62353515625, 12.1259765625, 12.62841796875, 13.130859375, 13.63330078125, 14.1357421875, 14.63818359375, 15.140625]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 10.0, 9.0, 11.0, 9.0, 13.0, 10.0, 15.0, 18.0, 17.0, 26.0, 30.0, 32.0, 46.0, 53.0, 33.0, 46.0, 58.0, 80.0, 378.0, 1619.0, 92.0, 65.0, 55.0, 44.0, 38.0, 29.0, 41.0, 25.0, 34.0, 18.0, 18.0, 13.0, 17.0, 8.0, 6.0, 11.0, 5.0, 3.0, 6.0, 9.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.6875, -34.41650390625, -33.1455078125, -31.87451171875, -30.603515625, -29.33251953125, -28.0615234375, -26.79052734375, -25.51953125, -24.24853515625, -22.9775390625, -21.70654296875, -20.435546875, -19.16455078125, -17.8935546875, -16.62255859375, -15.3515625, -14.08056640625, -12.8095703125, -11.53857421875, -10.267578125, -8.99658203125, -7.7255859375, -6.45458984375, -5.18359375, -3.91259765625, -2.6416015625, -1.37060546875, -0.099609375, 1.17138671875, 2.4423828125, 3.71337890625, 4.984375, 6.25537109375, 7.5263671875, 8.79736328125, 10.068359375, 11.33935546875, 12.6103515625, 13.88134765625, 15.15234375, 16.42333984375, 17.6943359375, 18.96533203125, 20.236328125, 21.50732421875, 22.7783203125, 24.04931640625, 25.3203125, 26.59130859375, 27.8623046875, 29.13330078125, 30.404296875, 31.67529296875, 32.9462890625, 34.21728515625, 35.48828125, 36.75927734375, 38.0302734375, 39.30126953125, 40.572265625, 41.84326171875, 43.1142578125, 44.38525390625, 45.65625]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 10.0, 7.0, 7.0, 11.0, 12.0, 8.0, 12.0, 19.0, 27.0, 25.0, 40.0, 61.0, 75.0, 90.0, 101.0, 150.0, 266.0, 698.0, 2972.0, 23391.0, 2989555.0, 118163.0, 7421.0, 1394.0, 388.0, 205.0, 135.0, 109.0, 77.0, 66.0, 47.0, 39.0, 31.0, 20.0, 12.0, 12.0, 10.0, 13.0, 9.0, 11.0, 6.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-82.8125, -80.49609375, -78.1796875, -75.86328125, -73.546875, -71.23046875, -68.9140625, -66.59765625, -64.28125, -61.96484375, -59.6484375, -57.33203125, -55.015625, -52.69921875, -50.3828125, -48.06640625, -45.75, -43.43359375, -41.1171875, -38.80078125, -36.484375, -34.16796875, -31.8515625, -29.53515625, -27.21875, -24.90234375, -22.5859375, -20.26953125, -17.953125, -15.63671875, -13.3203125, -11.00390625, -8.6875, -6.37109375, -4.0546875, -1.73828125, 0.578125, 2.89453125, 5.2109375, 7.52734375, 9.84375, 12.16015625, 14.4765625, 16.79296875, 19.109375, 21.42578125, 23.7421875, 26.05859375, 28.375, 30.69140625, 33.0078125, 35.32421875, 37.640625, 39.95703125, 42.2734375, 44.58984375, 46.90625, 49.22265625, 51.5390625, 53.85546875, 56.171875, 58.48828125, 60.8046875, 63.12109375, 65.4375]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 28.0, 447.0, 512.0, 33.0], "bins": [-662.664794921875, -651.9754638671875, -641.2861938476562, -630.5968627929688, -619.9075927734375, -609.21826171875, -598.5289916992188, -587.8396606445312, -577.150390625, -566.4610595703125, -555.7717895507812, -545.0824584960938, -534.3931884765625, -523.703857421875, -513.0145874023438, -502.3252868652344, -491.635986328125, -480.9466857910156, -470.25738525390625, -459.5680847167969, -448.8787841796875, -438.1894836425781, -427.50018310546875, -416.8108825683594, -406.1215515136719, -395.4322509765625, -384.7429504394531, -374.05364990234375, -363.3643493652344, -352.675048828125, -341.9857482910156, -331.29644775390625, -320.6071472167969, -309.9178466796875, -299.2285461425781, -288.53924560546875, -277.8499450683594, -267.16064453125, -256.4713439941406, -245.78204345703125, -235.09274291992188, -224.4034423828125, -213.71414184570312, -203.02484130859375, -192.33554077148438, -181.646240234375, -170.95693969726562, -160.26763916015625, -149.57833862304688, -138.8890380859375, -128.19973754882812, -117.51043701171875, -106.82113647460938, -96.1318359375, -85.4425277709961, -74.75322723388672, -64.06391906738281, -53.37461853027344, -42.68531799316406, -31.996013641357422, -21.306713104248047, -10.617412567138672, 0.07189178466796875, 10.761192321777344, 21.450489044189453]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 8.0, 4.0, 6.0, 6.0, 12.0, 10.0, 15.0, 11.0, 16.0, 19.0, 21.0, 24.0, 40.0, 35.0, 28.0, 24.0, 32.0, 28.0, 40.0, 43.0, 40.0, 34.0, 35.0, 32.0, 35.0, 37.0, 35.0, 41.0, 32.0, 33.0, 34.0, 31.0, 22.0, 17.0, 11.0, 20.0, 10.0, 14.0, 12.0, 5.0, 13.0, 8.0, 6.0, 5.0, 5.0, 7.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-81.49776458740234, -78.55269622802734, -75.60762786865234, -72.66256713867188, -69.71749877929688, -66.77243041992188, -63.827362060546875, -60.88229751586914, -57.937232971191406, -54.992164611816406, -52.04710006713867, -49.10203170776367, -46.15696716308594, -43.21189880371094, -40.26683044433594, -37.3217658996582, -34.3766975402832, -31.431631088256836, -28.48656463623047, -25.54149627685547, -22.596431732177734, -19.651363372802734, -16.706296920776367, -13.76123046875, -10.816164016723633, -7.871097564697266, -4.92603063583374, -1.9809637069702148, 0.9641027450561523, 3.9091691970825195, 6.854236602783203, 9.79930305480957, 12.744369506835938, 15.689435958862305, 18.634502410888672, 21.579570770263672, 24.524635314941406, 27.469703674316406, 30.414770126342773, 33.35983657836914, 36.304901123046875, 39.249969482421875, 42.19503402709961, 45.14010238647461, 48.085166931152344, 51.030235290527344, 53.975303649902344, 56.92036819458008, 59.86543655395508, 62.81050491333008, 65.75556945800781, 68.70063781738281, 71.64570617675781, 74.59076690673828, 77.53583526611328, 80.48090362548828, 83.42597198486328, 86.37104034423828, 89.31610870361328, 92.26116943359375, 95.20623779296875, 98.15130615234375, 101.09637451171875, 104.04144287109375, 106.98650360107422]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 5.0, 2.0, 3.0, 3.0, 2.0, 3.0, 6.0, 5.0, 11.0, 11.0, 16.0, 18.0, 14.0, 14.0, 23.0, 37.0, 34.0, 39.0, 32.0, 39.0, 37.0, 36.0, 55.0, 44.0, 44.0, 41.0, 52.0, 33.0, 30.0, 34.0, 47.0, 24.0, 28.0, 23.0, 36.0, 20.0, 22.0, 13.0, 10.0, 13.0, 11.0, 8.0, 10.0, 4.0, 7.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-13.3125, -12.939453125, -12.56640625, -12.193359375, -11.8203125, -11.447265625, -11.07421875, -10.701171875, -10.328125, -9.955078125, -9.58203125, -9.208984375, -8.8359375, -8.462890625, -8.08984375, -7.716796875, -7.34375, -6.970703125, -6.59765625, -6.224609375, -5.8515625, -5.478515625, -5.10546875, -4.732421875, -4.359375, -3.986328125, -3.61328125, -3.240234375, -2.8671875, -2.494140625, -2.12109375, -1.748046875, -1.375, -1.001953125, -0.62890625, -0.255859375, 0.1171875, 0.490234375, 0.86328125, 1.236328125, 1.609375, 1.982421875, 2.35546875, 2.728515625, 3.1015625, 3.474609375, 3.84765625, 4.220703125, 4.59375, 4.966796875, 5.33984375, 5.712890625, 6.0859375, 6.458984375, 6.83203125, 7.205078125, 7.578125, 7.951171875, 8.32421875, 8.697265625, 9.0703125, 9.443359375, 9.81640625, 10.189453125, 10.5625]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 1.0, 4.0, 2.0, 7.0, 10.0, 7.0, 14.0, 13.0, 12.0, 24.0, 35.0, 31.0, 55.0, 92.0, 91.0, 125.0, 195.0, 303.0, 472.0, 828.0, 1396.0, 2610.0, 5371.0, 12949.0, 42954.0, 442248.0, 2901188.0, 692827.0, 60820.0, 15952.0, 6480.0, 3049.0, 1582.0, 910.0, 530.0, 327.0, 234.0, 156.0, 100.0, 67.0, 48.0, 32.0, 28.0, 27.0, 21.0, 17.0, 11.0, 11.0, 10.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0], "bins": [-29.03125, -28.19189453125, -27.3525390625, -26.51318359375, -25.673828125, -24.83447265625, -23.9951171875, -23.15576171875, -22.31640625, -21.47705078125, -20.6376953125, -19.79833984375, -18.958984375, -18.11962890625, -17.2802734375, -16.44091796875, -15.6015625, -14.76220703125, -13.9228515625, -13.08349609375, -12.244140625, -11.40478515625, -10.5654296875, -9.72607421875, -8.88671875, -8.04736328125, -7.2080078125, -6.36865234375, -5.529296875, -4.68994140625, -3.8505859375, -3.01123046875, -2.171875, -1.33251953125, -0.4931640625, 0.34619140625, 1.185546875, 2.02490234375, 2.8642578125, 3.70361328125, 4.54296875, 5.38232421875, 6.2216796875, 7.06103515625, 7.900390625, 8.73974609375, 9.5791015625, 10.41845703125, 11.2578125, 12.09716796875, 12.9365234375, 13.77587890625, 14.615234375, 15.45458984375, 16.2939453125, 17.13330078125, 17.97265625, 18.81201171875, 19.6513671875, 20.49072265625, 21.330078125, 22.16943359375, 23.0087890625, 23.84814453125, 24.6875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 5.0, 5.0, 2.0, 7.0, 7.0, 6.0, 5.0, 11.0, 12.0, 6.0, 16.0, 17.0, 21.0, 32.0, 45.0, 51.0, 64.0, 79.0, 139.0, 201.0, 310.0, 549.0, 640.0, 610.0, 426.0, 243.0, 151.0, 91.0, 80.0, 60.0, 39.0, 37.0, 20.0, 16.0, 17.0, 12.0, 5.0, 5.0, 9.0, 8.0, 5.0, 7.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.421875, -20.747314453125, -20.07275390625, -19.398193359375, -18.7236328125, -18.049072265625, -17.37451171875, -16.699951171875, -16.025390625, -15.350830078125, -14.67626953125, -14.001708984375, -13.3271484375, -12.652587890625, -11.97802734375, -11.303466796875, -10.62890625, -9.954345703125, -9.27978515625, -8.605224609375, -7.9306640625, -7.256103515625, -6.58154296875, -5.906982421875, -5.232421875, -4.557861328125, -3.88330078125, -3.208740234375, -2.5341796875, -1.859619140625, -1.18505859375, -0.510498046875, 0.1640625, 0.838623046875, 1.51318359375, 2.187744140625, 2.8623046875, 3.536865234375, 4.21142578125, 4.885986328125, 5.560546875, 6.235107421875, 6.90966796875, 7.584228515625, 8.2587890625, 8.933349609375, 9.60791015625, 10.282470703125, 10.95703125, 11.631591796875, 12.30615234375, 12.980712890625, 13.6552734375, 14.329833984375, 15.00439453125, 15.678955078125, 16.353515625, 17.028076171875, 17.70263671875, 18.377197265625, 19.0517578125, 19.726318359375, 20.40087890625, 21.075439453125, 21.75]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 7.0, 4.0, 5.0, 9.0, 6.0, 8.0, 7.0, 8.0, 12.0, 17.0, 17.0, 26.0, 40.0, 52.0, 79.0, 105.0, 191.0, 467.0, 2148.0, 22950.0, 3268477.0, 883111.0, 14082.0, 1440.0, 416.0, 171.0, 108.0, 66.0, 65.0, 45.0, 23.0, 25.0, 20.0, 12.0, 9.0, 8.0, 12.0, 4.0, 9.0, 4.0, 5.0, 6.0, 4.0, 1.0, 6.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-101.125, -97.9560546875, -94.787109375, -91.6181640625, -88.44921875, -85.2802734375, -82.111328125, -78.9423828125, -75.7734375, -72.6044921875, -69.435546875, -66.2666015625, -63.09765625, -59.9287109375, -56.759765625, -53.5908203125, -50.421875, -47.2529296875, -44.083984375, -40.9150390625, -37.74609375, -34.5771484375, -31.408203125, -28.2392578125, -25.0703125, -21.9013671875, -18.732421875, -15.5634765625, -12.39453125, -9.2255859375, -6.056640625, -2.8876953125, 0.28125, 3.4501953125, 6.619140625, 9.7880859375, 12.95703125, 16.1259765625, 19.294921875, 22.4638671875, 25.6328125, 28.8017578125, 31.970703125, 35.1396484375, 38.30859375, 41.4775390625, 44.646484375, 47.8154296875, 50.984375, 54.1533203125, 57.322265625, 60.4912109375, 63.66015625, 66.8291015625, 69.998046875, 73.1669921875, 76.3359375, 79.5048828125, 82.673828125, 85.8427734375, 89.01171875, 92.1806640625, 95.349609375, 98.5185546875, 101.6875]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 9.0, 23.0, 83.0, 186.0, 327.0, 268.0, 78.0, 29.0, 9.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-413.9048156738281, -404.8369140625, -395.76898193359375, -386.7010803222656, -377.6331481933594, -368.56524658203125, -359.497314453125, -350.4294128417969, -341.36151123046875, -332.2936096191406, -323.2256774902344, -314.15777587890625, -305.08984375, -296.0219421386719, -286.9540100097656, -277.8861083984375, -268.81817626953125, -259.7502746582031, -250.68234252929688, -241.6144256591797, -232.5465087890625, -223.47860717773438, -214.4106903076172, -205.3427734375, -196.2748565673828, -187.20693969726562, -178.13902282714844, -169.07110595703125, -160.00320434570312, -150.93527221679688, -141.86737060546875, -132.79945373535156, -123.73152160644531, -114.66360473632812, -105.59568786621094, -96.52777862548828, -87.4598617553711, -78.3919448852539, -69.32403564453125, -60.25611877441406, -51.188201904296875, -42.12028503417969, -33.052371978759766, -23.98445701599121, -14.916542053222656, -5.848625183105469, 3.219287872314453, 12.287200927734375, 21.355117797851562, 30.423032760620117, 39.49094772338867, 48.558860778808594, 57.62677764892578, 66.69469451904297, 75.76260375976562, 84.83052062988281, 93.8984375, 102.96635437011719, 112.03427124023438, 121.10218048095703, 130.17010498046875, 139.23800659179688, 148.30592346191406, 157.37384033203125, 166.44175720214844]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 7.0, 8.0, 11.0, 16.0, 16.0, 17.0, 22.0, 26.0, 27.0, 34.0, 25.0, 36.0, 34.0, 40.0, 63.0, 46.0, 64.0, 54.0, 38.0, 51.0, 42.0, 40.0, 38.0, 30.0, 41.0, 32.0, 24.0, 26.0, 21.0, 19.0, 10.0, 14.0, 7.0, 5.0, 4.0, 3.0, 9.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-102.3641586303711, -99.72129821777344, -97.07844543457031, -94.43558502197266, -91.792724609375, -89.14987182617188, -86.50701141357422, -83.86415100097656, -81.22129821777344, -78.57843780517578, -75.93558502197266, -73.292724609375, -70.64987182617188, -68.00701141357422, -65.36415100097656, -62.72129440307617, -60.07843780517578, -57.43558120727539, -54.792724609375, -52.149864196777344, -49.50700759887695, -46.86415100097656, -44.221290588378906, -41.578433990478516, -38.935577392578125, -36.292720794677734, -33.649864196777344, -31.007003784179688, -28.364147186279297, -25.721290588378906, -23.078432083129883, -20.43557357788086, -17.792709350585938, -15.14985179901123, -12.506994247436523, -9.864136695861816, -7.221279144287109, -4.578421592712402, -1.9355640411376953, 0.7072944641113281, 3.3501510620117188, 5.993008613586426, 8.635866165161133, 11.27872371673584, 13.921581268310547, 16.564437866210938, 19.20729637145996, 21.850154876708984, 24.493011474609375, 27.135868072509766, 29.77872657775879, 32.42158508300781, 35.0644416809082, 37.707298278808594, 40.35015869140625, 42.99301528930664, 45.63587188720703, 48.27872848510742, 50.92158508300781, 53.56444549560547, 56.20730209350586, 58.85015869140625, 61.493019104003906, 64.13587951660156, 66.77873229980469]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 5.0, 7.0, 7.0, 6.0, 16.0, 21.0, 17.0, 16.0, 20.0, 28.0, 33.0, 29.0, 47.0, 46.0, 42.0, 48.0, 47.0, 49.0, 42.0, 50.0, 43.0, 47.0, 46.0, 41.0, 46.0, 34.0, 29.0, 22.0, 17.0, 23.0, 9.0, 8.0, 11.0, 10.0, 12.0, 10.0, 7.0, 2.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.53125, -11.1387939453125, -10.746337890625, -10.3538818359375, -9.96142578125, -9.5689697265625, -9.176513671875, -8.7840576171875, -8.3916015625, -7.9991455078125, -7.606689453125, -7.2142333984375, -6.82177734375, -6.4293212890625, -6.036865234375, -5.6444091796875, -5.251953125, -4.8594970703125, -4.467041015625, -4.0745849609375, -3.68212890625, -3.2896728515625, -2.897216796875, -2.5047607421875, -2.1123046875, -1.7198486328125, -1.327392578125, -0.9349365234375, -0.54248046875, -0.1500244140625, 0.242431640625, 0.6348876953125, 1.02734375, 1.4197998046875, 1.812255859375, 2.2047119140625, 2.59716796875, 2.9896240234375, 3.382080078125, 3.7745361328125, 4.1669921875, 4.5594482421875, 4.951904296875, 5.3443603515625, 5.73681640625, 6.1292724609375, 6.521728515625, 6.9141845703125, 7.306640625, 7.6990966796875, 8.091552734375, 8.4840087890625, 8.87646484375, 9.2689208984375, 9.661376953125, 10.0538330078125, 10.4462890625, 10.8387451171875, 11.231201171875, 11.6236572265625, 12.01611328125, 12.4085693359375, 12.801025390625, 13.1934814453125, 13.5859375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 3.0, 3.0, 3.0, 11.0, 7.0, 13.0, 38.0, 38.0, 70.0, 83.0, 119.0, 185.0, 288.0, 435.0, 612.0, 927.0, 1298.0, 2105.0, 2925.0, 4443.0, 6616.0, 10037.0, 15429.0, 23526.0, 36663.0, 57985.0, 94546.0, 162413.0, 228635.0, 152367.0, 90258.0, 54912.0, 35018.0, 22679.0, 14549.0, 9752.0, 6357.0, 4305.0, 2929.0, 1901.0, 1252.0, 919.0, 632.0, 421.0, 293.0, 185.0, 125.0, 82.0, 55.0, 44.0, 25.0, 20.0, 19.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.2421875, -0.23423385620117188, -0.22628021240234375, -0.21832656860351562, -0.2103729248046875, -0.20241928100585938, -0.19446563720703125, -0.18651199340820312, -0.178558349609375, -0.17060470581054688, -0.16265106201171875, -0.15469741821289062, -0.1467437744140625, -0.13879013061523438, -0.13083648681640625, -0.12288284301757812, -0.11492919921875, -0.10697555541992188, -0.09902191162109375, -0.09106826782226562, -0.0831146240234375, -0.07516098022460938, -0.06720733642578125, -0.059253692626953125, -0.051300048828125, -0.043346405029296875, -0.03539276123046875, -0.027439117431640625, -0.0194854736328125, -0.011531829833984375, -0.00357818603515625, 0.004375457763671875, 0.0123291015625, 0.020282745361328125, 0.02823638916015625, 0.036190032958984375, 0.0441436767578125, 0.052097320556640625, 0.06005096435546875, 0.06800460815429688, 0.075958251953125, 0.08391189575195312, 0.09186553955078125, 0.09981918334960938, 0.1077728271484375, 0.11572647094726562, 0.12368011474609375, 0.13163375854492188, 0.13958740234375, 0.14754104614257812, 0.15549468994140625, 0.16344833374023438, 0.1714019775390625, 0.17935562133789062, 0.18730926513671875, 0.19526290893554688, 0.203216552734375, 0.21117019653320312, 0.21912384033203125, 0.22707748413085938, 0.2350311279296875, 0.24298477172851562, 0.25093841552734375, 0.2588920593261719, 0.266845703125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 5.0, 3.0, 3.0, 9.0, 8.0, 14.0, 13.0, 15.0, 16.0, 15.0, 14.0, 20.0, 22.0, 30.0, 29.0, 36.0, 44.0, 41.0, 47.0, 39.0, 47.0, 42.0, 1073.0, 33.0, 51.0, 33.0, 32.0, 31.0, 32.0, 28.0, 28.0, 23.0, 19.0, 23.0, 28.0, 23.0, 15.0, 11.0, 5.0, 9.0, 6.0, 5.0, 4.0, 3.0, 0.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.265625, -8.9947509765625, -8.723876953125, -8.4530029296875, -8.18212890625, -7.9112548828125, -7.640380859375, -7.3695068359375, -7.0986328125, -6.8277587890625, -6.556884765625, -6.2860107421875, -6.01513671875, -5.7442626953125, -5.473388671875, -5.2025146484375, -4.931640625, -4.6607666015625, -4.389892578125, -4.1190185546875, -3.84814453125, -3.5772705078125, -3.306396484375, -3.0355224609375, -2.7646484375, -2.4937744140625, -2.222900390625, -1.9520263671875, -1.68115234375, -1.4102783203125, -1.139404296875, -0.8685302734375, -0.59765625, -0.3267822265625, -0.055908203125, 0.2149658203125, 0.48583984375, 0.7567138671875, 1.027587890625, 1.2984619140625, 1.5693359375, 1.8402099609375, 2.111083984375, 2.3819580078125, 2.65283203125, 2.9237060546875, 3.194580078125, 3.4654541015625, 3.736328125, 4.0072021484375, 4.278076171875, 4.5489501953125, 4.81982421875, 5.0906982421875, 5.361572265625, 5.6324462890625, 5.9033203125, 6.1741943359375, 6.445068359375, 6.7159423828125, 6.98681640625, 7.2576904296875, 7.528564453125, 7.7994384765625, 8.0703125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 3.0, 1.0, 5.0, 9.0, 13.0, 23.0, 29.0, 39.0, 64.0, 86.0, 101.0, 133.0, 204.0, 325.0, 452.0, 638.0, 959.0, 1282.0, 1958.0, 2712.0, 4097.0, 6002.0, 9216.0, 13708.0, 20504.0, 31385.0, 48777.0, 74989.0, 122619.0, 1209038.0, 222482.0, 116616.0, 72149.0, 46336.0, 30170.0, 19723.0, 12773.0, 8714.0, 5930.0, 4035.0, 2754.0, 1911.0, 1282.0, 882.0, 626.0, 426.0, 286.0, 212.0, 131.0, 102.0, 76.0, 54.0, 33.0, 24.0, 14.0, 13.0, 4.0, 5.0, 6.0, 3.0, 2.0], "bins": [-0.1263427734375, -0.12250804901123047, -0.11867332458496094, -0.1148386001586914, -0.11100387573242188, -0.10716915130615234, -0.10333442687988281, -0.09949970245361328, -0.09566497802734375, -0.09183025360107422, -0.08799552917480469, -0.08416080474853516, -0.08032608032226562, -0.0764913558959961, -0.07265663146972656, -0.06882190704345703, -0.0649871826171875, -0.06115245819091797, -0.05731773376464844, -0.053483009338378906, -0.049648284912109375, -0.045813560485839844, -0.04197883605957031, -0.03814411163330078, -0.03430938720703125, -0.03047466278076172, -0.026639938354492188, -0.022805213928222656, -0.018970489501953125, -0.015135765075683594, -0.011301040649414062, -0.007466316223144531, -0.003631591796875, 0.00020313262939453125, 0.0040378570556640625, 0.007872581481933594, 0.011707305908203125, 0.015542030334472656, 0.019376754760742188, 0.02321147918701172, 0.02704620361328125, 0.03088092803955078, 0.03471565246582031, 0.038550376892089844, 0.042385101318359375, 0.046219825744628906, 0.05005455017089844, 0.05388927459716797, 0.0577239990234375, 0.06155872344970703, 0.06539344787597656, 0.0692281723022461, 0.07306289672851562, 0.07689762115478516, 0.08073234558105469, 0.08456707000732422, 0.08840179443359375, 0.09223651885986328, 0.09607124328613281, 0.09990596771240234, 0.10374069213867188, 0.1075754165649414, 0.11141014099121094, 0.11524486541748047, 0.11907958984375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 3.0, 3.0, 4.0, 6.0, 7.0, 13.0, 7.0, 16.0, 17.0, 24.0, 13.0, 40.0, 33.0, 42.0, 46.0, 57.0, 51.0, 53.0, 79.0, 55.0, 62.0, 61.0, 51.0, 51.0, 28.0, 30.0, 20.0, 22.0, 21.0, 23.0, 20.0, 7.0, 9.0, 7.0, 1.0, 7.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0007834434509277344, -0.0007560700178146362, -0.0007286965847015381, -0.0007013231515884399, -0.0006739497184753418, -0.0006465762853622437, -0.0006192028522491455, -0.0005918294191360474, -0.0005644559860229492, -0.0005370825529098511, -0.0005097091197967529, -0.0004823356866836548, -0.00045496225357055664, -0.0004275888204574585, -0.00040021538734436035, -0.0003728419542312622, -0.00034546852111816406, -0.0003180950880050659, -0.0002907216548919678, -0.00026334822177886963, -0.00023597478866577148, -0.00020860135555267334, -0.0001812279224395752, -0.00015385448932647705, -0.0001264810562133789, -9.910762310028076e-05, -7.173418998718262e-05, -4.436075687408447e-05, -1.6987323760986328e-05, 1.0386109352111816e-05, 3.775954246520996e-05, 6.51329755783081e-05, 9.250640869140625e-05, 0.0001198798418045044, 0.00014725327491760254, 0.00017462670803070068, 0.00020200014114379883, 0.00022937357425689697, 0.0002567470073699951, 0.00028412044048309326, 0.0003114938735961914, 0.00033886730670928955, 0.0003662407398223877, 0.00039361417293548584, 0.000420987606048584, 0.00044836103916168213, 0.0004757344722747803, 0.0005031079053878784, 0.0005304813385009766, 0.0005578547716140747, 0.0005852282047271729, 0.000612601637840271, 0.0006399750709533691, 0.0006673485040664673, 0.0006947219371795654, 0.0007220953702926636, 0.0007494688034057617, 0.0007768422365188599, 0.000804215669631958, 0.0008315891027450562, 0.0008589625358581543, 0.0008863359689712524, 0.0009137094020843506, 0.0009410828351974487, 0.0009684562683105469]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 6.0, 3.0, 3.0, 10.0, 9.0, 13.0, 27.0, 14.0, 31.0, 22.0, 32.0, 28.0, 64.0, 95.0, 194.0, 506.0, 4028.0, 1033124.0, 9130.0, 632.0, 205.0, 98.0, 58.0, 45.0, 48.0, 16.0, 24.0, 16.0, 15.0, 9.0, 11.0, 8.0, 6.0, 6.0, 2.0, 4.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.0225067138671875, -0.021874189376831055, -0.02124166488647461, -0.020609140396118164, -0.01997661590576172, -0.019344091415405273, -0.018711566925048828, -0.018079042434692383, -0.017446517944335938, -0.016813993453979492, -0.016181468963623047, -0.015548944473266602, -0.014916419982910156, -0.014283895492553711, -0.013651371002197266, -0.01301884651184082, -0.012386322021484375, -0.01175379753112793, -0.011121273040771484, -0.010488748550415039, -0.009856224060058594, -0.009223699569702148, -0.008591175079345703, -0.007958650588989258, -0.0073261260986328125, -0.006693601608276367, -0.006061077117919922, -0.0054285526275634766, -0.004796028137207031, -0.004163503646850586, -0.0035309791564941406, -0.0028984546661376953, -0.00226593017578125, -0.0016334056854248047, -0.0010008811950683594, -0.00036835670471191406, 0.00026416778564453125, 0.0008966922760009766, 0.0015292167663574219, 0.002161741256713867, 0.0027942657470703125, 0.003426790237426758, 0.004059314727783203, 0.0046918392181396484, 0.005324363708496094, 0.005956888198852539, 0.006589412689208984, 0.00722193717956543, 0.007854461669921875, 0.00848698616027832, 0.009119510650634766, 0.009752035140991211, 0.010384559631347656, 0.011017084121704102, 0.011649608612060547, 0.012282133102416992, 0.012914657592773438, 0.013547182083129883, 0.014179706573486328, 0.014812231063842773, 0.015444755554199219, 0.016077280044555664, 0.01670980453491211, 0.017342329025268555, 0.017974853515625]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 305.0, 707.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.022845227271318436, -0.02241465635597706, -0.02198408544063568, -0.021553512662649155, -0.021122941747307777, -0.0206923708319664, -0.020261799916625023, -0.019831229001283646, -0.01940065808594227, -0.01897008717060089, -0.018539516255259514, -0.018108945339918137, -0.01767837256193161, -0.017247801646590233, -0.016817230731248856, -0.01638665981590748, -0.0159560889005661, -0.015525517985224724, -0.015094946138560772, -0.014664375223219395, -0.014233804307878017, -0.013803232461214066, -0.013372661545872688, -0.012942090630531311, -0.012511517852544785, -0.012080946937203407, -0.011650375090539455, -0.011219804175198078, -0.010789233259856701, -0.010358661413192749, -0.009928090497851372, -0.009497519582509995, -0.009066947735846043, -0.008636376820504665, -0.008205804973840714, -0.007775234058499336, -0.007344663143157959, -0.006914091762155294, -0.00648352038115263, -0.006052949465811253, -0.005622378084808588, -0.0051918067038059235, -0.004761235788464546, -0.004330664407461882, -0.0039000932592898607, -0.00346952211111784, -0.0030389507301151752, -0.0026083795819431543, -0.0021778084337711334, -0.0017472372855991125, -0.0013166660210117698, -0.000886094756424427, -0.0004555236082524061, -2.4952460080385208e-05, 0.00040561892092227936, 0.0008361900690943003, 0.0012667612172663212, 0.001697332365438342, 0.002127903513610363, 0.0025584748946130276, 0.0029890460427850485, 0.0034196171909570694, 0.003850188571959734, 0.0042807599529623985, 0.004711330868303776]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 3.0, 10.0, 13.0, 16.0, 9.0, 22.0, 25.0, 22.0, 30.0, 41.0, 31.0, 39.0, 54.0, 34.0, 63.0, 53.0, 39.0, 52.0, 55.0, 54.0, 33.0, 30.0, 41.0, 32.0, 35.0, 20.0, 20.0, 27.0, 19.0, 19.0, 17.0, 9.0, 12.0, 4.0, 7.0, 3.0, 6.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0007668137550354004, -0.0007376745343208313, -0.0007085353136062622, -0.0006793960928916931, -0.000650256872177124, -0.0006211176514625549, -0.0005919784307479858, -0.0005628392100334167, -0.0005336999893188477, -0.0005045607686042786, -0.00047542154788970947, -0.0004462823271751404, -0.0004171431064605713, -0.0003880038857460022, -0.0003588646650314331, -0.000329725444316864, -0.0003005862236022949, -0.00027144700288772583, -0.00024230778217315674, -0.00021316856145858765, -0.00018402934074401855, -0.00015489012002944946, -0.00012575089931488037, -9.661167860031128e-05, -6.747245788574219e-05, -3.8333237171173096e-05, -9.194016456604004e-06, 1.9945204257965088e-05, 4.908442497253418e-05, 7.822364568710327e-05, 0.00010736286640167236, 0.00013650208711624146, 0.00016564130783081055, 0.00019478052854537964, 0.00022391974925994873, 0.0002530589699745178, 0.0002821981906890869, 0.000311337411403656, 0.0003404766321182251, 0.0003696158528327942, 0.0003987550735473633, 0.0004278942942619324, 0.00045703351497650146, 0.00048617273569107056, 0.0005153119564056396, 0.0005444511771202087, 0.0005735903978347778, 0.0006027296185493469, 0.000631868839263916, 0.0006610080599784851, 0.0006901472806930542, 0.0007192865014076233, 0.0007484257221221924, 0.0007775649428367615, 0.0008067041635513306, 0.0008358433842658997, 0.0008649826049804688, 0.0008941218256950378, 0.0009232610464096069, 0.000952400267124176, 0.0009815394878387451, 0.0010106787085533142, 0.0010398179292678833, 0.0010689571499824524, 0.0010980963706970215]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 5.0, 7.0, 7.0, 6.0, 16.0, 21.0, 17.0, 16.0, 20.0, 28.0, 33.0, 29.0, 47.0, 46.0, 42.0, 48.0, 47.0, 49.0, 42.0, 50.0, 43.0, 47.0, 46.0, 41.0, 46.0, 34.0, 29.0, 22.0, 17.0, 23.0, 9.0, 8.0, 11.0, 10.0, 12.0, 10.0, 7.0, 2.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.53125, -11.1387939453125, -10.746337890625, -10.3538818359375, -9.96142578125, -9.5689697265625, -9.176513671875, -8.7840576171875, -8.3916015625, -7.9991455078125, -7.606689453125, -7.2142333984375, -6.82177734375, -6.4293212890625, -6.036865234375, -5.6444091796875, -5.251953125, -4.8594970703125, -4.467041015625, -4.0745849609375, -3.68212890625, -3.2896728515625, -2.897216796875, -2.5047607421875, -2.1123046875, -1.7198486328125, -1.327392578125, -0.9349365234375, -0.54248046875, -0.1500244140625, 0.242431640625, 0.6348876953125, 1.02734375, 1.4197998046875, 1.812255859375, 2.2047119140625, 2.59716796875, 2.9896240234375, 3.382080078125, 3.7745361328125, 4.1669921875, 4.5594482421875, 4.951904296875, 5.3443603515625, 5.73681640625, 6.1292724609375, 6.521728515625, 6.9141845703125, 7.306640625, 7.6990966796875, 8.091552734375, 8.4840087890625, 8.87646484375, 9.2689208984375, 9.661376953125, 10.0538330078125, 10.4462890625, 10.8387451171875, 11.231201171875, 11.6236572265625, 12.01611328125, 12.4085693359375, 12.801025390625, 13.1934814453125, 13.5859375]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 2.0, 7.0, 11.0, 10.0, 11.0, 11.0, 19.0, 23.0, 45.0, 54.0, 79.0, 106.0, 149.0, 172.0, 232.0, 339.0, 483.0, 698.0, 1030.0, 1402.0, 2091.0, 3260.0, 4902.0, 8415.0, 16188.0, 39790.0, 139154.0, 623795.0, 129454.0, 37939.0, 15742.0, 8023.0, 4955.0, 3124.0, 2086.0, 1351.0, 961.0, 699.0, 482.0, 352.0, 231.0, 187.0, 141.0, 91.0, 76.0, 43.0, 35.0, 31.0, 20.0, 18.0, 19.0, 4.0, 14.0, 8.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-13.3984375, -12.9727783203125, -12.547119140625, -12.1214599609375, -11.69580078125, -11.2701416015625, -10.844482421875, -10.4188232421875, -9.9931640625, -9.5675048828125, -9.141845703125, -8.7161865234375, -8.29052734375, -7.8648681640625, -7.439208984375, -7.0135498046875, -6.587890625, -6.1622314453125, -5.736572265625, -5.3109130859375, -4.88525390625, -4.4595947265625, -4.033935546875, -3.6082763671875, -3.1826171875, -2.7569580078125, -2.331298828125, -1.9056396484375, -1.47998046875, -1.0543212890625, -0.628662109375, -0.2030029296875, 0.22265625, 0.6483154296875, 1.073974609375, 1.4996337890625, 1.92529296875, 2.3509521484375, 2.776611328125, 3.2022705078125, 3.6279296875, 4.0535888671875, 4.479248046875, 4.9049072265625, 5.33056640625, 5.7562255859375, 6.181884765625, 6.6075439453125, 7.033203125, 7.4588623046875, 7.884521484375, 8.3101806640625, 8.73583984375, 9.1614990234375, 9.587158203125, 10.0128173828125, 10.4384765625, 10.8641357421875, 11.289794921875, 11.7154541015625, 12.14111328125, 12.5667724609375, 12.992431640625, 13.4180908203125, 13.84375]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 1.0, 4.0, 6.0, 8.0, 8.0, 9.0, 14.0, 9.0, 19.0, 20.0, 21.0, 21.0, 19.0, 30.0, 21.0, 33.0, 42.0, 38.0, 50.0, 50.0, 91.0, 177.0, 1736.0, 150.0, 68.0, 48.0, 48.0, 35.0, 39.0, 36.0, 25.0, 31.0, 29.0, 26.0, 23.0, 18.0, 10.0, 14.0, 5.0, 6.0, 4.0, 4.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-37.9375, -36.73095703125, -35.5244140625, -34.31787109375, -33.111328125, -31.90478515625, -30.6982421875, -29.49169921875, -28.28515625, -27.07861328125, -25.8720703125, -24.66552734375, -23.458984375, -22.25244140625, -21.0458984375, -19.83935546875, -18.6328125, -17.42626953125, -16.2197265625, -15.01318359375, -13.806640625, -12.60009765625, -11.3935546875, -10.18701171875, -8.98046875, -7.77392578125, -6.5673828125, -5.36083984375, -4.154296875, -2.94775390625, -1.7412109375, -0.53466796875, 0.671875, 1.87841796875, 3.0849609375, 4.29150390625, 5.498046875, 6.70458984375, 7.9111328125, 9.11767578125, 10.32421875, 11.53076171875, 12.7373046875, 13.94384765625, 15.150390625, 16.35693359375, 17.5634765625, 18.77001953125, 19.9765625, 21.18310546875, 22.3896484375, 23.59619140625, 24.802734375, 26.00927734375, 27.2158203125, 28.42236328125, 29.62890625, 30.83544921875, 32.0419921875, 33.24853515625, 34.455078125, 35.66162109375, 36.8681640625, 38.07470703125, 39.28125]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 9.0, 6.0, 9.0, 14.0, 17.0, 21.0, 29.0, 31.0, 34.0, 45.0, 50.0, 91.0, 140.0, 146.0, 229.0, 645.0, 2103.0, 13423.0, 2467508.0, 647140.0, 10784.0, 1814.0, 515.0, 238.0, 146.0, 115.0, 86.0, 49.0, 48.0, 39.0, 37.0, 31.0, 35.0, 11.0, 9.0, 13.0, 10.0, 8.0, 4.0, 7.0, 5.0, 6.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-88.8125, -86.271484375, -83.73046875, -81.189453125, -78.6484375, -76.107421875, -73.56640625, -71.025390625, -68.484375, -65.943359375, -63.40234375, -60.861328125, -58.3203125, -55.779296875, -53.23828125, -50.697265625, -48.15625, -45.615234375, -43.07421875, -40.533203125, -37.9921875, -35.451171875, -32.91015625, -30.369140625, -27.828125, -25.287109375, -22.74609375, -20.205078125, -17.6640625, -15.123046875, -12.58203125, -10.041015625, -7.5, -4.958984375, -2.41796875, 0.123046875, 2.6640625, 5.205078125, 7.74609375, 10.287109375, 12.828125, 15.369140625, 17.91015625, 20.451171875, 22.9921875, 25.533203125, 28.07421875, 30.615234375, 33.15625, 35.697265625, 38.23828125, 40.779296875, 43.3203125, 45.861328125, 48.40234375, 50.943359375, 53.484375, 56.025390625, 58.56640625, 61.107421875, 63.6484375, 66.189453125, 68.73046875, 71.271484375, 73.8125]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 42.0, 218.0, 542.0, 161.0, 36.0, 8.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.95651245117188, -108.3705062866211, -101.78450012207031, -95.19850158691406, -88.61249542236328, -82.0264892578125, -75.44048309326172, -68.85447692871094, -62.26847457885742, -55.68246841430664, -49.096466064453125, -42.510459899902344, -35.92445373535156, -29.338451385498047, -22.752445220947266, -16.16644287109375, -9.580436706542969, -2.994431972503662, 3.5915727615356445, 10.17757797241211, 16.763582229614258, 23.349586486816406, 29.935592651367188, 36.5215950012207, 43.107601165771484, 49.693607330322266, 56.27960968017578, 62.86561584472656, 69.45162200927734, 76.03762817382812, 82.62362670898438, 89.20963287353516, 95.79563903808594, 102.38164520263672, 108.9676513671875, 115.55364990234375, 122.13965606689453, 128.7256622314453, 135.31167602539062, 141.89767456054688, 148.48367309570312, 155.06967163085938, 161.6556854248047, 168.24168395996094, 174.82769775390625, 181.4136962890625, 187.99969482421875, 194.58570861816406, 201.17172241210938, 207.75772094726562, 214.34373474121094, 220.9297332763672, 227.5157470703125, 234.10174560546875, 240.687744140625, 247.2737579345703, 253.85975646972656, 260.4457702636719, 267.0317687988281, 273.6177673339844, 280.2037658691406, 286.789794921875, 293.37579345703125, 299.9617919921875, 306.54779052734375]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 5.0, 1.0, 3.0, 2.0, 3.0, 2.0, 10.0, 6.0, 11.0, 14.0, 11.0, 8.0, 7.0, 14.0, 12.0, 39.0, 31.0, 39.0, 25.0, 37.0, 41.0, 44.0, 44.0, 42.0, 43.0, 43.0, 43.0, 35.0, 41.0, 35.0, 47.0, 27.0, 38.0, 35.0, 18.0, 21.0, 18.0, 22.0, 13.0, 18.0, 17.0, 11.0, 7.0, 7.0, 7.0, 6.0, 2.0, 1.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-88.6780776977539, -85.90892791748047, -83.13977813720703, -80.37063598632812, -77.60148620605469, -74.83233642578125, -72.06318664550781, -69.29403686523438, -66.52489471435547, -63.75574493408203, -60.98659896850586, -58.21744918823242, -55.44830322265625, -52.67915344238281, -49.910003662109375, -47.1408576965332, -44.371707916259766, -41.60255813598633, -38.833412170410156, -36.06426239013672, -33.29511642456055, -30.52596664428711, -27.756818771362305, -24.9876708984375, -22.218523025512695, -19.44937515258789, -16.680227279663086, -13.911078453063965, -11.14193058013916, -8.372782707214355, -5.603633880615234, -2.8344860076904297, -0.065338134765625, 2.703809976577759, 5.472958087921143, 8.242106437683105, 11.01125431060791, 13.780402183532715, 16.549551010131836, 19.31869888305664, 22.087846755981445, 24.85699462890625, 27.626142501831055, 30.39529037475586, 33.1644401550293, 35.93358612060547, 38.702735900878906, 41.471885681152344, 44.241031646728516, 47.01018142700195, 49.779327392578125, 52.54847717285156, 55.317623138427734, 58.08677291870117, 60.855918884277344, 63.62506866455078, 66.39421844482422, 69.16336822509766, 71.9325180053711, 74.70166015625, 77.47080993652344, 80.23995971679688, 83.00910949707031, 85.77825927734375, 88.54740142822266]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 1.0, 4.0, 5.0, 4.0, 6.0, 15.0, 14.0, 16.0, 16.0, 18.0, 15.0, 26.0, 25.0, 34.0, 44.0, 44.0, 45.0, 47.0, 46.0, 34.0, 51.0, 50.0, 46.0, 38.0, 34.0, 41.0, 47.0, 39.0, 29.0, 30.0, 23.0, 25.0, 11.0, 15.0, 11.0, 9.0, 8.0, 3.0, 9.0, 5.0, 7.0, 5.0, 7.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.9921875, -11.604736328125, -11.21728515625, -10.829833984375, -10.4423828125, -10.054931640625, -9.66748046875, -9.280029296875, -8.892578125, -8.505126953125, -8.11767578125, -7.730224609375, -7.3427734375, -6.955322265625, -6.56787109375, -6.180419921875, -5.79296875, -5.405517578125, -5.01806640625, -4.630615234375, -4.2431640625, -3.855712890625, -3.46826171875, -3.080810546875, -2.693359375, -2.305908203125, -1.91845703125, -1.531005859375, -1.1435546875, -0.756103515625, -0.36865234375, 0.018798828125, 0.40625, 0.793701171875, 1.18115234375, 1.568603515625, 1.9560546875, 2.343505859375, 2.73095703125, 3.118408203125, 3.505859375, 3.893310546875, 4.28076171875, 4.668212890625, 5.0556640625, 5.443115234375, 5.83056640625, 6.218017578125, 6.60546875, 6.992919921875, 7.38037109375, 7.767822265625, 8.1552734375, 8.542724609375, 8.93017578125, 9.317626953125, 9.705078125, 10.092529296875, 10.47998046875, 10.867431640625, 11.2548828125, 11.642333984375, 12.02978515625, 12.417236328125, 12.8046875]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 2.0, 8.0, 6.0, 13.0, 20.0, 21.0, 20.0, 26.0, 34.0, 64.0, 78.0, 139.0, 218.0, 429.0, 935.0, 2282.0, 6164.0, 19801.0, 146059.0, 3074374.0, 883168.0, 42907.0, 10812.0, 3701.0, 1376.0, 688.0, 365.0, 181.0, 113.0, 62.0, 59.0, 40.0, 26.0, 14.0, 11.0, 13.0, 9.0, 6.0, 9.0, 7.0, 4.0, 5.0, 7.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.03125, -34.85986328125, -33.6884765625, -32.51708984375, -31.345703125, -30.17431640625, -29.0029296875, -27.83154296875, -26.66015625, -25.48876953125, -24.3173828125, -23.14599609375, -21.974609375, -20.80322265625, -19.6318359375, -18.46044921875, -17.2890625, -16.11767578125, -14.9462890625, -13.77490234375, -12.603515625, -11.43212890625, -10.2607421875, -9.08935546875, -7.91796875, -6.74658203125, -5.5751953125, -4.40380859375, -3.232421875, -2.06103515625, -0.8896484375, 0.28173828125, 1.453125, 2.62451171875, 3.7958984375, 4.96728515625, 6.138671875, 7.31005859375, 8.4814453125, 9.65283203125, 10.82421875, 11.99560546875, 13.1669921875, 14.33837890625, 15.509765625, 16.68115234375, 17.8525390625, 19.02392578125, 20.1953125, 21.36669921875, 22.5380859375, 23.70947265625, 24.880859375, 26.05224609375, 27.2236328125, 28.39501953125, 29.56640625, 30.73779296875, 31.9091796875, 33.08056640625, 34.251953125, 35.42333984375, 36.5947265625, 37.76611328125, 38.9375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 0.0, 5.0, 5.0, 3.0, 7.0, 8.0, 17.0, 19.0, 15.0, 27.0, 30.0, 31.0, 53.0, 75.0, 101.0, 126.0, 261.0, 485.0, 740.0, 748.0, 520.0, 302.0, 144.0, 103.0, 65.0, 40.0, 37.0, 23.0, 21.0, 10.0, 15.0, 9.0, 9.0, 3.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.78125, -25.001708984375, -24.22216796875, -23.442626953125, -22.6630859375, -21.883544921875, -21.10400390625, -20.324462890625, -19.544921875, -18.765380859375, -17.98583984375, -17.206298828125, -16.4267578125, -15.647216796875, -14.86767578125, -14.088134765625, -13.30859375, -12.529052734375, -11.74951171875, -10.969970703125, -10.1904296875, -9.410888671875, -8.63134765625, -7.851806640625, -7.072265625, -6.292724609375, -5.51318359375, -4.733642578125, -3.9541015625, -3.174560546875, -2.39501953125, -1.615478515625, -0.8359375, -0.056396484375, 0.72314453125, 1.502685546875, 2.2822265625, 3.061767578125, 3.84130859375, 4.620849609375, 5.400390625, 6.179931640625, 6.95947265625, 7.739013671875, 8.5185546875, 9.298095703125, 10.07763671875, 10.857177734375, 11.63671875, 12.416259765625, 13.19580078125, 13.975341796875, 14.7548828125, 15.534423828125, 16.31396484375, 17.093505859375, 17.873046875, 18.652587890625, 19.43212890625, 20.211669921875, 20.9912109375, 21.770751953125, 22.55029296875, 23.329833984375, 24.109375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 4.0, 6.0, 4.0, 11.0, 12.0, 13.0, 22.0, 25.0, 29.0, 51.0, 76.0, 142.0, 309.0, 1206.0, 13398.0, 3166538.0, 1001611.0, 9165.0, 966.0, 221.0, 145.0, 84.0, 56.0, 36.0, 29.0, 32.0, 19.0, 16.0, 15.0, 10.0, 8.0, 1.0, 5.0, 4.0, 1.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-117.375, -113.5810546875, -109.787109375, -105.9931640625, -102.19921875, -98.4052734375, -94.611328125, -90.8173828125, -87.0234375, -83.2294921875, -79.435546875, -75.6416015625, -71.84765625, -68.0537109375, -64.259765625, -60.4658203125, -56.671875, -52.8779296875, -49.083984375, -45.2900390625, -41.49609375, -37.7021484375, -33.908203125, -30.1142578125, -26.3203125, -22.5263671875, -18.732421875, -14.9384765625, -11.14453125, -7.3505859375, -3.556640625, 0.2373046875, 4.03125, 7.8251953125, 11.619140625, 15.4130859375, 19.20703125, 23.0009765625, 26.794921875, 30.5888671875, 34.3828125, 38.1767578125, 41.970703125, 45.7646484375, 49.55859375, 53.3525390625, 57.146484375, 60.9404296875, 64.734375, 68.5283203125, 72.322265625, 76.1162109375, 79.91015625, 83.7041015625, 87.498046875, 91.2919921875, 95.0859375, 98.8798828125, 102.673828125, 106.4677734375, 110.26171875, 114.0556640625, 117.849609375, 121.6435546875, 125.4375]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 11.0, 23.0, 57.0, 90.0, 157.0, 195.0, 201.0, 145.0, 75.0, 27.0, 19.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-132.41262817382812, -127.2995834350586, -122.1865463256836, -117.07350158691406, -111.96046447753906, -106.84741973876953, -101.734375, -96.621337890625, -91.50829315185547, -86.39524841308594, -81.28221130371094, -76.1691665649414, -71.05612182617188, -65.94308471679688, -60.830039978027344, -55.71699905395508, -50.60395812988281, -45.49091720581055, -40.37787628173828, -35.26483154296875, -30.151790618896484, -25.03874969482422, -19.92570686340332, -14.812664031982422, -9.699623107910156, -4.586581230163574, 0.5264606475830078, 5.63950252532959, 10.752544403076172, 15.865585327148438, 20.978628158569336, 26.091670989990234, 31.204696655273438, 36.3177375793457, 41.43077850341797, 46.5438232421875, 51.656864166259766, 56.76990509033203, 61.88294982910156, 66.99598693847656, 72.1090316772461, 77.22207641601562, 82.33511352539062, 87.44815826416016, 92.56120300292969, 97.67424011230469, 102.78728485107422, 107.90032958984375, 113.01336669921875, 118.12641143798828, 123.23944854736328, 128.3524932861328, 133.4655303955078, 138.57858276367188, 143.69161987304688, 148.80465698242188, 153.91769409179688, 159.03073120117188, 164.14378356933594, 169.25682067871094, 174.36985778808594, 179.48291015625, 184.595947265625, 189.708984375, 194.82203674316406]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 1.0, 3.0, 7.0, 8.0, 11.0, 12.0, 18.0, 14.0, 16.0, 24.0, 22.0, 29.0, 35.0, 32.0, 40.0, 27.0, 39.0, 41.0, 50.0, 49.0, 39.0, 57.0, 45.0, 37.0, 48.0, 38.0, 28.0, 38.0, 37.0, 29.0, 29.0, 21.0, 18.0, 12.0, 10.0, 10.0, 8.0, 7.0, 6.0, 2.0, 1.0, 0.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-75.47439575195312, -73.06916046142578, -70.66392517089844, -68.25869750976562, -65.85346221923828, -63.44822692871094, -61.042991638183594, -58.63775634765625, -56.23252487182617, -53.82728958129883, -51.42205810546875, -49.016822814941406, -46.61158752441406, -44.206356048583984, -41.80112075805664, -39.39588928222656, -36.99065399169922, -34.585418701171875, -32.1801872253418, -29.774951934814453, -27.369718551635742, -24.96448516845703, -22.559249877929688, -20.154016494750977, -17.748783111572266, -15.343549728393555, -12.938315391540527, -10.5330810546875, -8.127847671508789, -5.722614288330078, -3.317379951477051, -0.9121456146240234, 1.4930877685546875, 3.8983216285705566, 6.303555488586426, 8.708789825439453, 11.114023208618164, 13.519256591796875, 15.924490928649902, 18.32972526550293, 20.73495864868164, 23.14019203186035, 25.545425415039062, 27.950660705566406, 30.355894088745117, 32.76112747192383, 35.16636276245117, 37.57159423828125, 39.976829528808594, 42.38206481933594, 44.787296295166016, 47.19253158569336, 49.59776306152344, 52.00299835205078, 54.408233642578125, 56.81346893310547, 59.21870040893555, 61.62393569946289, 64.02916717529297, 66.43440246582031, 68.83963775634766, 71.244873046875, 73.65010070800781, 76.05533599853516, 78.4605712890625]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 2.0, 6.0, 1.0, 5.0, 1.0, 8.0, 8.0, 8.0, 13.0, 20.0, 19.0, 18.0, 20.0, 29.0, 33.0, 34.0, 42.0, 34.0, 41.0, 40.0, 43.0, 42.0, 33.0, 49.0, 39.0, 44.0, 42.0, 35.0, 44.0, 26.0, 29.0, 35.0, 18.0, 22.0, 19.0, 17.0, 16.0, 12.0, 11.0, 7.0, 10.0, 5.0, 4.0, 6.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.0078125, -10.6531982421875, -10.298583984375, -9.9439697265625, -9.58935546875, -9.2347412109375, -8.880126953125, -8.5255126953125, -8.1708984375, -7.8162841796875, -7.461669921875, -7.1070556640625, -6.75244140625, -6.3978271484375, -6.043212890625, -5.6885986328125, -5.333984375, -4.9793701171875, -4.624755859375, -4.2701416015625, -3.91552734375, -3.5609130859375, -3.206298828125, -2.8516845703125, -2.4970703125, -2.1424560546875, -1.787841796875, -1.4332275390625, -1.07861328125, -0.7239990234375, -0.369384765625, -0.0147705078125, 0.33984375, 0.6944580078125, 1.049072265625, 1.4036865234375, 1.75830078125, 2.1129150390625, 2.467529296875, 2.8221435546875, 3.1767578125, 3.5313720703125, 3.885986328125, 4.2406005859375, 4.59521484375, 4.9498291015625, 5.304443359375, 5.6590576171875, 6.013671875, 6.3682861328125, 6.722900390625, 7.0775146484375, 7.43212890625, 7.7867431640625, 8.141357421875, 8.4959716796875, 8.8505859375, 9.2052001953125, 9.559814453125, 9.9144287109375, 10.26904296875, 10.6236572265625, 10.978271484375, 11.3328857421875, 11.6875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [5.0, 0.0, 5.0, 7.0, 6.0, 10.0, 21.0, 16.0, 24.0, 33.0, 53.0, 71.0, 95.0, 142.0, 201.0, 291.0, 405.0, 548.0, 774.0, 1119.0, 1524.0, 2302.0, 3233.0, 4731.0, 6505.0, 9760.0, 14520.0, 21567.0, 32333.0, 49374.0, 75475.0, 116719.0, 186003.0, 183837.0, 115538.0, 74450.0, 48511.0, 31814.0, 21155.0, 14196.0, 9511.0, 6533.0, 4583.0, 3167.0, 2176.0, 1509.0, 1064.0, 790.0, 559.0, 368.0, 272.0, 174.0, 151.0, 111.0, 68.0, 38.0, 41.0, 28.0, 19.0, 18.0, 9.0, 7.0, 5.0, 2.0], "bins": [-0.2447509765625, -0.23732948303222656, -0.22990798950195312, -0.2224864959716797, -0.21506500244140625, -0.2076435089111328, -0.20022201538085938, -0.19280052185058594, -0.1853790283203125, -0.17795753479003906, -0.17053604125976562, -0.1631145477294922, -0.15569305419921875, -0.1482715606689453, -0.14085006713867188, -0.13342857360839844, -0.126007080078125, -0.11858558654785156, -0.11116409301757812, -0.10374259948730469, -0.09632110595703125, -0.08889961242675781, -0.08147811889648438, -0.07405662536621094, -0.0666351318359375, -0.05921363830566406, -0.051792144775390625, -0.04437065124511719, -0.03694915771484375, -0.029527664184570312, -0.022106170654296875, -0.014684677124023438, -0.00726318359375, 0.0001583099365234375, 0.007579803466796875, 0.015001296997070312, 0.02242279052734375, 0.029844284057617188, 0.037265777587890625, 0.04468727111816406, 0.0521087646484375, 0.05953025817871094, 0.06695175170898438, 0.07437324523925781, 0.08179473876953125, 0.08921623229980469, 0.09663772583007812, 0.10405921936035156, 0.111480712890625, 0.11890220642089844, 0.12632369995117188, 0.1337451934814453, 0.14116668701171875, 0.1485881805419922, 0.15600967407226562, 0.16343116760253906, 0.1708526611328125, 0.17827415466308594, 0.18569564819335938, 0.1931171417236328, 0.20053863525390625, 0.2079601287841797, 0.21538162231445312, 0.22280311584472656, 0.230224609375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 8.0, 8.0, 5.0, 7.0, 9.0, 13.0, 23.0, 20.0, 23.0, 36.0, 25.0, 29.0, 43.0, 30.0, 45.0, 29.0, 35.0, 45.0, 1067.0, 49.0, 52.0, 39.0, 46.0, 41.0, 35.0, 35.0, 22.0, 38.0, 18.0, 27.0, 27.0, 16.0, 20.0, 13.0, 14.0, 10.0, 7.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.25, -7.9605712890625, -7.671142578125, -7.3817138671875, -7.09228515625, -6.8028564453125, -6.513427734375, -6.2239990234375, -5.9345703125, -5.6451416015625, -5.355712890625, -5.0662841796875, -4.77685546875, -4.4874267578125, -4.197998046875, -3.9085693359375, -3.619140625, -3.3297119140625, -3.040283203125, -2.7508544921875, -2.46142578125, -2.1719970703125, -1.882568359375, -1.5931396484375, -1.3037109375, -1.0142822265625, -0.724853515625, -0.4354248046875, -0.14599609375, 0.1434326171875, 0.432861328125, 0.7222900390625, 1.01171875, 1.3011474609375, 1.590576171875, 1.8800048828125, 2.16943359375, 2.4588623046875, 2.748291015625, 3.0377197265625, 3.3271484375, 3.6165771484375, 3.906005859375, 4.1954345703125, 4.48486328125, 4.7742919921875, 5.063720703125, 5.3531494140625, 5.642578125, 5.9320068359375, 6.221435546875, 6.5108642578125, 6.80029296875, 7.0897216796875, 7.379150390625, 7.6685791015625, 7.9580078125, 8.2474365234375, 8.536865234375, 8.8262939453125, 9.11572265625, 9.4051513671875, 9.694580078125, 9.9840087890625, 10.2734375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 4.0, 8.0, 9.0, 9.0, 23.0, 33.0, 70.0, 78.0, 118.0, 152.0, 250.0, 358.0, 491.0, 809.0, 1132.0, 1786.0, 2546.0, 3868.0, 6008.0, 9198.0, 14203.0, 21965.0, 34272.0, 53427.0, 84543.0, 139063.0, 1259097.0, 173519.0, 106158.0, 66261.0, 41833.0, 26542.0, 17115.0, 10950.0, 7101.0, 4689.0, 3031.0, 2082.0, 1374.0, 949.0, 629.0, 448.0, 294.0, 207.0, 146.0, 96.0, 64.0, 44.0, 34.0, 19.0, 11.0, 6.0, 5.0, 10.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.1217041015625, -0.11761093139648438, -0.11351776123046875, -0.10942459106445312, -0.1053314208984375, -0.10123825073242188, -0.09714508056640625, -0.09305191040039062, -0.088958740234375, -0.08486557006835938, -0.08077239990234375, -0.07667922973632812, -0.0725860595703125, -0.06849288940429688, -0.06439971923828125, -0.060306549072265625, -0.05621337890625, -0.052120208740234375, -0.04802703857421875, -0.043933868408203125, -0.0398406982421875, -0.035747528076171875, -0.03165435791015625, -0.027561187744140625, -0.023468017578125, -0.019374847412109375, -0.01528167724609375, -0.011188507080078125, -0.0070953369140625, -0.003002166748046875, 0.00109100341796875, 0.005184173583984375, 0.00927734375, 0.013370513916015625, 0.01746368408203125, 0.021556854248046875, 0.0256500244140625, 0.029743194580078125, 0.03383636474609375, 0.037929534912109375, 0.042022705078125, 0.046115875244140625, 0.05020904541015625, 0.054302215576171875, 0.0583953857421875, 0.062488555908203125, 0.06658172607421875, 0.07067489624023438, 0.07476806640625, 0.07886123657226562, 0.08295440673828125, 0.08704757690429688, 0.0911407470703125, 0.09523391723632812, 0.09932708740234375, 0.10342025756835938, 0.107513427734375, 0.11160659790039062, 0.11569976806640625, 0.11979293823242188, 0.1238861083984375, 0.12797927856445312, 0.13207244873046875, 0.13616561889648438, 0.1402587890625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 11.0, 3.0, 14.0, 12.0, 19.0, 13.0, 24.0, 31.0, 44.0, 45.0, 71.0, 96.0, 85.0, 100.0, 76.0, 70.0, 64.0, 33.0, 42.0, 28.0, 20.0, 23.0, 16.0, 12.0, 10.0, 9.0, 8.0, 4.0, 4.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011749267578125, -0.0011394768953323364, -0.0011040270328521729, -0.0010685771703720093, -0.0010331273078918457, -0.0009976774454116821, -0.0009622275829315186, -0.000926777720451355, -0.0008913278579711914, -0.0008558779954910278, -0.0008204281330108643, -0.0007849782705307007, -0.0007495284080505371, -0.0007140785455703735, -0.00067862868309021, -0.0006431788206100464, -0.0006077289581298828, -0.0005722790956497192, -0.0005368292331695557, -0.0005013793706893921, -0.0004659295082092285, -0.00043047964572906494, -0.00039502978324890137, -0.0003595799207687378, -0.0003241300582885742, -0.00028868019580841064, -0.00025323033332824707, -0.0002177804708480835, -0.00018233060836791992, -0.00014688074588775635, -0.00011143088340759277, -7.59810209274292e-05, -4.0531158447265625e-05, -5.081295967102051e-06, 3.0368566513061523e-05, 6.58184289932251e-05, 0.00010126829147338867, 0.00013671815395355225, 0.00017216801643371582, 0.0002076178789138794, 0.00024306774139404297, 0.00027851760387420654, 0.0003139674663543701, 0.0003494173288345337, 0.00038486719131469727, 0.00042031705379486084, 0.0004557669162750244, 0.000491216778755188, 0.0005266666412353516, 0.0005621165037155151, 0.0005975663661956787, 0.0006330162286758423, 0.0006684660911560059, 0.0007039159536361694, 0.000739365816116333, 0.0007748156785964966, 0.0008102655410766602, 0.0008457154035568237, 0.0008811652660369873, 0.0009166151285171509, 0.0009520649909973145, 0.000987514853477478, 0.0010229647159576416, 0.0010584145784378052, 0.0010938644409179688]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 4.0, 10.0, 7.0, 11.0, 12.0, 17.0, 21.0, 23.0, 29.0, 52.0, 54.0, 121.0, 276.0, 1337.0, 1016373.0, 29138.0, 600.0, 183.0, 79.0, 55.0, 36.0, 23.0, 16.0, 19.0, 11.0, 15.0, 2.0, 11.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0255584716796875, -0.02472853660583496, -0.023898601531982422, -0.023068666458129883, -0.022238731384277344, -0.021408796310424805, -0.020578861236572266, -0.019748926162719727, -0.018918991088867188, -0.01808905601501465, -0.01725912094116211, -0.01642918586730957, -0.015599250793457031, -0.014769315719604492, -0.013939380645751953, -0.013109445571899414, -0.012279510498046875, -0.011449575424194336, -0.010619640350341797, -0.009789705276489258, -0.008959770202636719, -0.00812983512878418, -0.007299900054931641, -0.0064699649810791016, -0.0056400299072265625, -0.0048100948333740234, -0.003980159759521484, -0.0031502246856689453, -0.0023202896118164062, -0.0014903545379638672, -0.0006604194641113281, 0.00016951560974121094, 0.00099945068359375, 0.001829385757446289, 0.002659320831298828, 0.003489255905151367, 0.004319190979003906, 0.005149126052856445, 0.005979061126708984, 0.0068089962005615234, 0.0076389312744140625, 0.008468866348266602, 0.00929880142211914, 0.01012873649597168, 0.010958671569824219, 0.011788606643676758, 0.012618541717529297, 0.013448476791381836, 0.014278411865234375, 0.015108346939086914, 0.015938282012939453, 0.016768217086791992, 0.01759815216064453, 0.01842808723449707, 0.01925802230834961, 0.02008795738220215, 0.020917892456054688, 0.021747827529907227, 0.022577762603759766, 0.023407697677612305, 0.024237632751464844, 0.025067567825317383, 0.025897502899169922, 0.02672743797302246, 0.027557373046875]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 29.0, 973.0, 14.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02001454494893551, -0.01960132271051407, -0.01918810047209263, -0.018774880096316338, -0.018361657857894897, -0.017948435619473457, -0.017535213381052017, -0.017121993005275726, -0.016708770766854286, -0.016295548528432846, -0.015882326290011406, -0.01546910498291254, -0.015055883675813675, -0.014642661437392235, -0.01422944013029337, -0.01381621789187193, -0.013402996584773064, -0.012989774346351624, -0.012576553039252758, -0.012163330800831318, -0.011750109493732452, -0.011336887255311012, -0.010923665948212147, -0.010510443709790707, -0.010097221471369267, -0.009683999232947826, -0.009270777925848961, -0.00885755568742752, -0.008444334380328655, -0.008031112141907215, -0.00761789083480835, -0.0072046685963869095, -0.006791446823626757, -0.006378225050866604, -0.005965003278106451, -0.005551781505346298, -0.005138559732586145, -0.004725337959825993, -0.0043121157214045525, -0.0038988941814750433, -0.0034856724087148905, -0.0030724506359547377, -0.002659228863194585, -0.0022460068576037884, -0.0018327852012589574, -0.0014195633120834827, -0.00100634153932333, -0.0005931197665631771, -0.0001798979938030243, 0.00023332380806095898, 0.0006465456099249423, 0.001059767440892756, 0.0014729892136529088, 0.0018862111028283834, 0.0022994328755885363, 0.002712654648348689, 0.003125876421108842, 0.0035390981938689947, 0.003952320199459791, 0.004365541972219944, 0.004778763744980097, 0.00519198551774025, 0.0056052072905004025, 0.006018429063260555, 0.006431650836020708]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 13.0, 13.0, 15.0, 18.0, 27.0, 27.0, 28.0, 45.0, 43.0, 45.0, 55.0, 43.0, 57.0, 52.0, 70.0, 61.0, 59.0, 53.0, 52.0, 38.0, 33.0, 38.0, 29.0, 22.0, 22.0, 13.0, 11.0, 8.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008541345596313477, -0.000818164087831974, -0.0007821936160326004, -0.0007462231442332268, -0.0007102526724338531, -0.0006742822006344795, -0.0006383117288351059, -0.0006023412570357323, -0.0005663707852363586, -0.000530400313436985, -0.0004944298416376114, -0.00045845936983823776, -0.00042248889803886414, -0.0003865184262394905, -0.0003505479544401169, -0.00031457748264074326, -0.00027860701084136963, -0.000242636539041996, -0.00020666606724262238, -0.00017069559544324875, -0.00013472512364387512, -9.87546518445015e-05, -6.278418004512787e-05, -2.6813708245754242e-05, 9.156763553619385e-06, 4.512723535299301e-05, 8.109770715236664e-05, 0.00011706817895174026, 0.0001530386507511139, 0.00018900912255048752, 0.00022497959434986115, 0.00026095006614923477, 0.0002969205379486084, 0.000332891009747982, 0.00036886148154735565, 0.0004048319533467293, 0.0004408024251461029, 0.00047677289694547653, 0.0005127433687448502, 0.0005487138405442238, 0.0005846843123435974, 0.000620654784142971, 0.0006566252559423447, 0.0006925957277417183, 0.0007285661995410919, 0.0007645366713404655, 0.0008005071431398392, 0.0008364776149392128, 0.0008724480867385864, 0.00090841855853796, 0.0009443890303373337, 0.0009803595021367073, 0.001016329973936081, 0.0010523004457354546, 0.0010882709175348282, 0.0011242413893342018, 0.0011602118611335754, 0.001196182332932949, 0.0012321528047323227, 0.0012681232765316963, 0.00130409374833107, 0.0013400642201304436, 0.0013760346919298172, 0.0014120051637291908, 0.0014479756355285645]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 2.0, 6.0, 1.0, 5.0, 1.0, 8.0, 8.0, 8.0, 13.0, 20.0, 19.0, 18.0, 20.0, 29.0, 33.0, 34.0, 42.0, 34.0, 41.0, 40.0, 43.0, 42.0, 33.0, 49.0, 39.0, 44.0, 42.0, 35.0, 44.0, 26.0, 29.0, 35.0, 18.0, 22.0, 19.0, 17.0, 16.0, 12.0, 11.0, 7.0, 10.0, 5.0, 4.0, 6.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.0078125, -10.6531982421875, -10.298583984375, -9.9439697265625, -9.58935546875, -9.2347412109375, -8.880126953125, -8.5255126953125, -8.1708984375, -7.8162841796875, -7.461669921875, -7.1070556640625, -6.75244140625, -6.3978271484375, -6.043212890625, -5.6885986328125, -5.333984375, -4.9793701171875, -4.624755859375, -4.2701416015625, -3.91552734375, -3.5609130859375, -3.206298828125, -2.8516845703125, -2.4970703125, -2.1424560546875, -1.787841796875, -1.4332275390625, -1.07861328125, -0.7239990234375, -0.369384765625, -0.0147705078125, 0.33984375, 0.6944580078125, 1.049072265625, 1.4036865234375, 1.75830078125, 2.1129150390625, 2.467529296875, 2.8221435546875, 3.1767578125, 3.5313720703125, 3.885986328125, 4.2406005859375, 4.59521484375, 4.9498291015625, 5.304443359375, 5.6590576171875, 6.013671875, 6.3682861328125, 6.722900390625, 7.0775146484375, 7.43212890625, 7.7867431640625, 8.141357421875, 8.4959716796875, 8.8505859375, 9.2052001953125, 9.559814453125, 9.9144287109375, 10.26904296875, 10.6236572265625, 10.978271484375, 11.3328857421875, 11.6875]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 13.0, 24.0, 36.0, 32.0, 62.0, 83.0, 118.0, 162.0, 286.0, 381.0, 584.0, 940.0, 1550.0, 2575.0, 4714.0, 8813.0, 17360.0, 41374.0, 235358.0, 623616.0, 62569.0, 23148.0, 10850.0, 5678.0, 3063.0, 1905.0, 1146.0, 760.0, 433.0, 313.0, 183.0, 122.0, 89.0, 52.0, 57.0, 28.0, 28.0, 5.0, 13.0, 9.0, 11.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.8125, -16.170166015625, -15.52783203125, -14.885498046875, -14.2431640625, -13.600830078125, -12.95849609375, -12.316162109375, -11.673828125, -11.031494140625, -10.38916015625, -9.746826171875, -9.1044921875, -8.462158203125, -7.81982421875, -7.177490234375, -6.53515625, -5.892822265625, -5.25048828125, -4.608154296875, -3.9658203125, -3.323486328125, -2.68115234375, -2.038818359375, -1.396484375, -0.754150390625, -0.11181640625, 0.530517578125, 1.1728515625, 1.815185546875, 2.45751953125, 3.099853515625, 3.7421875, 4.384521484375, 5.02685546875, 5.669189453125, 6.3115234375, 6.953857421875, 7.59619140625, 8.238525390625, 8.880859375, 9.523193359375, 10.16552734375, 10.807861328125, 11.4501953125, 12.092529296875, 12.73486328125, 13.377197265625, 14.01953125, 14.661865234375, 15.30419921875, 15.946533203125, 16.5888671875, 17.231201171875, 17.87353515625, 18.515869140625, 19.158203125, 19.800537109375, 20.44287109375, 21.085205078125, 21.7275390625, 22.369873046875, 23.01220703125, 23.654541015625, 24.296875]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 4.0, 6.0, 2.0, 4.0, 7.0, 7.0, 10.0, 9.0, 18.0, 14.0, 23.0, 24.0, 25.0, 24.0, 34.0, 37.0, 33.0, 45.0, 50.0, 61.0, 85.0, 192.0, 1723.0, 121.0, 81.0, 58.0, 56.0, 44.0, 32.0, 28.0, 26.0, 34.0, 25.0, 16.0, 25.0, 11.0, 5.0, 20.0, 10.0, 9.0, 6.0, 5.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.34375, -31.27734375, -30.2109375, -29.14453125, -28.078125, -27.01171875, -25.9453125, -24.87890625, -23.8125, -22.74609375, -21.6796875, -20.61328125, -19.546875, -18.48046875, -17.4140625, -16.34765625, -15.28125, -14.21484375, -13.1484375, -12.08203125, -11.015625, -9.94921875, -8.8828125, -7.81640625, -6.75, -5.68359375, -4.6171875, -3.55078125, -2.484375, -1.41796875, -0.3515625, 0.71484375, 1.78125, 2.84765625, 3.9140625, 4.98046875, 6.046875, 7.11328125, 8.1796875, 9.24609375, 10.3125, 11.37890625, 12.4453125, 13.51171875, 14.578125, 15.64453125, 16.7109375, 17.77734375, 18.84375, 19.91015625, 20.9765625, 22.04296875, 23.109375, 24.17578125, 25.2421875, 26.30859375, 27.375, 28.44140625, 29.5078125, 30.57421875, 31.640625, 32.70703125, 33.7734375, 34.83984375, 35.90625]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 3.0, 6.0, 6.0, 7.0, 11.0, 13.0, 33.0, 35.0, 35.0, 51.0, 71.0, 93.0, 127.0, 216.0, 364.0, 1078.0, 4535.0, 36465.0, 2971330.0, 119285.0, 8852.0, 1730.0, 544.0, 243.0, 172.0, 103.0, 71.0, 59.0, 38.0, 34.0, 21.0, 20.0, 10.0, 11.0, 14.0, 7.0, 5.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.8125, -64.4833984375, -62.154296875, -59.8251953125, -57.49609375, -55.1669921875, -52.837890625, -50.5087890625, -48.1796875, -45.8505859375, -43.521484375, -41.1923828125, -38.86328125, -36.5341796875, -34.205078125, -31.8759765625, -29.546875, -27.2177734375, -24.888671875, -22.5595703125, -20.23046875, -17.9013671875, -15.572265625, -13.2431640625, -10.9140625, -8.5849609375, -6.255859375, -3.9267578125, -1.59765625, 0.7314453125, 3.060546875, 5.3896484375, 7.71875, 10.0478515625, 12.376953125, 14.7060546875, 17.03515625, 19.3642578125, 21.693359375, 24.0224609375, 26.3515625, 28.6806640625, 31.009765625, 33.3388671875, 35.66796875, 37.9970703125, 40.326171875, 42.6552734375, 44.984375, 47.3134765625, 49.642578125, 51.9716796875, 54.30078125, 56.6298828125, 58.958984375, 61.2880859375, 63.6171875, 65.9462890625, 68.275390625, 70.6044921875, 72.93359375, 75.2626953125, 77.591796875, 79.9208984375, 82.25]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 122.0, 866.0, 27.0], "bins": [-1239.0430908203125, -1219.1612548828125, -1199.279296875, -1179.3974609375, -1159.515625, -1139.6337890625, -1119.7518310546875, -1099.8699951171875, -1079.9881591796875, -1060.1063232421875, -1040.224365234375, -1020.342529296875, -1000.460693359375, -980.5787963867188, -960.6968994140625, -940.8150634765625, -920.93310546875, -901.0512084960938, -881.1693725585938, -861.2874755859375, -841.4056396484375, -821.5237426757812, -801.641845703125, -781.760009765625, -761.878173828125, -741.9962768554688, -722.1144409179688, -702.2325439453125, -682.3507080078125, -662.4688110351562, -642.5869140625, -622.705078125, -602.8231811523438, -582.9412841796875, -563.0594482421875, -543.1775512695312, -523.2957153320312, -503.413818359375, -483.5319519042969, -463.65008544921875, -443.7681884765625, -423.8863220214844, -404.00445556640625, -384.12255859375, -364.2406921386719, -344.35882568359375, -324.4769592285156, -304.5950927734375, -284.71319580078125, -264.8313293457031, -244.94944763183594, -225.0675811767578, -205.18569946289062, -185.3038330078125, -165.42196655273438, -145.5400848388672, -125.65821838378906, -105.7763442993164, -85.89447021484375, -66.01260375976562, -46.13072967529297, -26.248855590820312, -6.3669891357421875, 13.514892578125, 33.39675521850586]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 5.0, 7.0, 6.0, 10.0, 5.0, 6.0, 13.0, 14.0, 18.0, 23.0, 19.0, 21.0, 32.0, 28.0, 34.0, 34.0, 29.0, 35.0, 35.0, 31.0, 45.0, 38.0, 52.0, 36.0, 42.0, 38.0, 41.0, 35.0, 30.0, 29.0, 29.0, 30.0, 24.0, 13.0, 21.0, 12.0, 16.0, 13.0, 16.0, 10.0, 5.0, 5.0, 5.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-78.21829223632812, -75.77754974365234, -73.33680725097656, -70.89607238769531, -68.45532989501953, -66.01458740234375, -63.57384490966797, -61.13310241699219, -58.69236373901367, -56.25162124633789, -53.810882568359375, -51.370140075683594, -48.92939758300781, -46.4886589050293, -44.047916412353516, -41.607177734375, -39.16643524169922, -36.72569274902344, -34.28495407104492, -31.84421157836914, -29.403470993041992, -26.962730407714844, -24.521987915039062, -22.081247329711914, -19.640506744384766, -17.199766159057617, -14.759024620056152, -12.318283081054688, -9.877542495727539, -7.436801910400391, -4.996060371398926, -2.555318832397461, -0.11458587646484375, 2.326155185699463, 4.7668962478637695, 7.207637310028076, 9.648378372192383, 12.089118957519531, 14.529860496520996, 16.97060203552246, 19.41134262084961, 21.852083206176758, 24.292823791503906, 26.733566284179688, 29.174306869506836, 31.615047454833984, 34.055789947509766, 36.49652862548828, 38.93727111816406, 41.378013610839844, 43.81875228881836, 46.25949478149414, 48.700233459472656, 51.14097595214844, 53.58171844482422, 56.0224609375, 58.463199615478516, 60.9039421081543, 63.34468078613281, 65.7854232788086, 68.22616577148438, 70.66690063476562, 73.1076431274414, 75.54838562011719, 77.98912811279297]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 3.0, 4.0, 3.0, 6.0, 7.0, 10.0, 9.0, 14.0, 9.0, 14.0, 19.0, 23.0, 31.0, 28.0, 34.0, 26.0, 38.0, 33.0, 30.0, 40.0, 40.0, 41.0, 31.0, 34.0, 35.0, 44.0, 38.0, 38.0, 31.0, 35.0, 32.0, 29.0, 25.0, 23.0, 26.0, 17.0, 12.0, 7.0, 17.0, 8.0, 9.0, 9.0, 5.0, 10.0, 2.0, 4.0, 2.0, 1.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0], "bins": [-11.2421875, -10.89111328125, -10.5400390625, -10.18896484375, -9.837890625, -9.48681640625, -9.1357421875, -8.78466796875, -8.43359375, -8.08251953125, -7.7314453125, -7.38037109375, -7.029296875, -6.67822265625, -6.3271484375, -5.97607421875, -5.625, -5.27392578125, -4.9228515625, -4.57177734375, -4.220703125, -3.86962890625, -3.5185546875, -3.16748046875, -2.81640625, -2.46533203125, -2.1142578125, -1.76318359375, -1.412109375, -1.06103515625, -0.7099609375, -0.35888671875, -0.0078125, 0.34326171875, 0.6943359375, 1.04541015625, 1.396484375, 1.74755859375, 2.0986328125, 2.44970703125, 2.80078125, 3.15185546875, 3.5029296875, 3.85400390625, 4.205078125, 4.55615234375, 4.9072265625, 5.25830078125, 5.609375, 5.96044921875, 6.3115234375, 6.66259765625, 7.013671875, 7.36474609375, 7.7158203125, 8.06689453125, 8.41796875, 8.76904296875, 9.1201171875, 9.47119140625, 9.822265625, 10.17333984375, 10.5244140625, 10.87548828125, 11.2265625]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 4.0, 5.0, 8.0, 8.0, 12.0, 14.0, 18.0, 19.0, 20.0, 26.0, 46.0, 70.0, 124.0, 200.0, 383.0, 794.0, 2090.0, 6047.0, 21449.0, 234319.0, 3529361.0, 362935.0, 25184.0, 6684.0, 2394.0, 986.0, 445.0, 224.0, 110.0, 77.0, 53.0, 41.0, 19.0, 27.0, 15.0, 11.0, 8.0, 10.0, 11.0, 3.0, 5.0, 3.0, 5.0, 3.0, 2.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.5, -38.16357421875, -36.8271484375, -35.49072265625, -34.154296875, -32.81787109375, -31.4814453125, -30.14501953125, -28.80859375, -27.47216796875, -26.1357421875, -24.79931640625, -23.462890625, -22.12646484375, -20.7900390625, -19.45361328125, -18.1171875, -16.78076171875, -15.4443359375, -14.10791015625, -12.771484375, -11.43505859375, -10.0986328125, -8.76220703125, -7.42578125, -6.08935546875, -4.7529296875, -3.41650390625, -2.080078125, -0.74365234375, 0.5927734375, 1.92919921875, 3.265625, 4.60205078125, 5.9384765625, 7.27490234375, 8.611328125, 9.94775390625, 11.2841796875, 12.62060546875, 13.95703125, 15.29345703125, 16.6298828125, 17.96630859375, 19.302734375, 20.63916015625, 21.9755859375, 23.31201171875, 24.6484375, 25.98486328125, 27.3212890625, 28.65771484375, 29.994140625, 31.33056640625, 32.6669921875, 34.00341796875, 35.33984375, 36.67626953125, 38.0126953125, 39.34912109375, 40.685546875, 42.02197265625, 43.3583984375, 44.69482421875, 46.03125]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 7.0, 9.0, 13.0, 10.0, 16.0, 17.0, 24.0, 42.0, 43.0, 59.0, 70.0, 121.0, 205.0, 390.0, 726.0, 872.0, 573.0, 323.0, 185.0, 109.0, 71.0, 63.0, 28.0, 37.0, 11.0, 7.0, 9.0, 8.0, 3.0, 8.0, 4.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-32.28125, -31.438720703125, -30.59619140625, -29.753662109375, -28.9111328125, -28.068603515625, -27.22607421875, -26.383544921875, -25.541015625, -24.698486328125, -23.85595703125, -23.013427734375, -22.1708984375, -21.328369140625, -20.48583984375, -19.643310546875, -18.80078125, -17.958251953125, -17.11572265625, -16.273193359375, -15.4306640625, -14.588134765625, -13.74560546875, -12.903076171875, -12.060546875, -11.218017578125, -10.37548828125, -9.532958984375, -8.6904296875, -7.847900390625, -7.00537109375, -6.162841796875, -5.3203125, -4.477783203125, -3.63525390625, -2.792724609375, -1.9501953125, -1.107666015625, -0.26513671875, 0.577392578125, 1.419921875, 2.262451171875, 3.10498046875, 3.947509765625, 4.7900390625, 5.632568359375, 6.47509765625, 7.317626953125, 8.16015625, 9.002685546875, 9.84521484375, 10.687744140625, 11.5302734375, 12.372802734375, 13.21533203125, 14.057861328125, 14.900390625, 15.742919921875, 16.58544921875, 17.427978515625, 18.2705078125, 19.113037109375, 19.95556640625, 20.798095703125, 21.640625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 5.0, 4.0, 6.0, 6.0, 7.0, 8.0, 2.0, 9.0, 15.0, 33.0, 36.0, 54.0, 76.0, 142.0, 292.0, 1007.0, 22037.0, 4091031.0, 76887.0, 1793.0, 362.0, 147.0, 82.0, 62.0, 42.0, 38.0, 24.0, 21.0, 12.0, 11.0, 15.0, 7.0, 6.0, 3.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-130.25, -125.359375, -120.46875, -115.578125, -110.6875, -105.796875, -100.90625, -96.015625, -91.125, -86.234375, -81.34375, -76.453125, -71.5625, -66.671875, -61.78125, -56.890625, -52.0, -47.109375, -42.21875, -37.328125, -32.4375, -27.546875, -22.65625, -17.765625, -12.875, -7.984375, -3.09375, 1.796875, 6.6875, 11.578125, 16.46875, 21.359375, 26.25, 31.140625, 36.03125, 40.921875, 45.8125, 50.703125, 55.59375, 60.484375, 65.375, 70.265625, 75.15625, 80.046875, 84.9375, 89.828125, 94.71875, 99.609375, 104.5, 109.390625, 114.28125, 119.171875, 124.0625, 128.953125, 133.84375, 138.734375, 143.625, 148.515625, 153.40625, 158.296875, 163.1875, 168.078125, 172.96875, 177.859375, 182.75]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 15.0, 39.0, 62.0, 133.0, 234.0, 234.0, 154.0, 82.0, 32.0, 11.0, 7.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-260.8446960449219, -255.1780548095703, -249.51141357421875, -243.8447723388672, -238.17813110351562, -232.51148986816406, -226.8448486328125, -221.17822265625, -215.51156616210938, -209.8449249267578, -204.17828369140625, -198.5116424560547, -192.84500122070312, -187.17835998535156, -181.51171875, -175.8450927734375, -170.17845153808594, -164.51181030273438, -158.8451690673828, -153.17852783203125, -147.5118865966797, -141.84524536132812, -136.17861938476562, -130.511962890625, -124.84532928466797, -119.1786880493164, -113.51204681396484, -107.84541320800781, -102.17877197265625, -96.51213073730469, -90.84548950195312, -85.17884826660156, -79.51219177246094, -73.84555053710938, -68.17890930175781, -62.512271881103516, -56.84563064575195, -51.17898941040039, -45.512351989746094, -39.84571075439453, -34.17906951904297, -28.512428283691406, -22.845788955688477, -17.179149627685547, -11.512508392333984, -5.845867156982422, -0.179229736328125, 5.4874114990234375, 11.154052734375, 16.820693969726562, 22.487333297729492, 28.153972625732422, 33.820613861083984, 39.48725509643555, 45.153892517089844, 50.820533752441406, 56.48717498779297, 62.15381622314453, 67.8204574584961, 73.48709106445312, 79.15373229980469, 84.82037353515625, 90.48701477050781, 96.15365600585938, 101.82029724121094]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 6.0, 7.0, 8.0, 7.0, 7.0, 19.0, 17.0, 12.0, 21.0, 17.0, 25.0, 18.0, 24.0, 31.0, 35.0, 38.0, 39.0, 25.0, 31.0, 41.0, 36.0, 37.0, 41.0, 38.0, 38.0, 36.0, 34.0, 50.0, 34.0, 24.0, 33.0, 27.0, 28.0, 20.0, 19.0, 12.0, 17.0, 10.0, 5.0, 9.0, 8.0, 6.0, 3.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-68.22395324707031, -66.15882110595703, -64.09368133544922, -62.02854919433594, -59.96341323852539, -57.898277282714844, -55.8331413269043, -53.76800537109375, -51.70287322998047, -49.63773727416992, -47.572601318359375, -45.507469177246094, -43.44233322143555, -41.377197265625, -39.31206130981445, -37.246925354003906, -35.18178939819336, -33.11665344238281, -31.0515193939209, -28.98638343811035, -26.921249389648438, -24.85611343383789, -22.790977478027344, -20.725841522216797, -18.660707473754883, -16.595571517944336, -14.530437469482422, -12.465301513671875, -10.400166511535645, -8.335031509399414, -6.269895553588867, -4.204760551452637, -2.1396255493164062, -0.07449030876159668, 1.990644931793213, 4.055780410766602, 6.120915412902832, 8.186050415039062, 10.25118637084961, 12.31632137298584, 14.38145637512207, 16.446592330932617, 18.51172637939453, 20.576862335205078, 22.641998291015625, 24.70713233947754, 26.772268295288086, 28.83740234375, 30.902538299560547, 32.967674255371094, 35.03281021118164, 37.09794616699219, 39.16307830810547, 41.228214263916016, 43.29335021972656, 45.35848617553711, 47.423622131347656, 49.4887580871582, 51.55389404296875, 53.61902618408203, 55.68416213989258, 57.749298095703125, 59.81443405151367, 61.87957000732422, 63.9447021484375]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 1.0, 6.0, 6.0, 3.0, 9.0, 13.0, 12.0, 21.0, 19.0, 21.0, 25.0, 27.0, 25.0, 39.0, 28.0, 35.0, 41.0, 27.0, 26.0, 38.0, 48.0, 45.0, 52.0, 49.0, 38.0, 41.0, 34.0, 35.0, 36.0, 19.0, 29.0, 23.0, 16.0, 23.0, 11.0, 19.0, 18.0, 8.0, 8.0, 8.0, 4.0, 4.0, 1.0, 4.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.78125, -10.4022216796875, -10.023193359375, -9.6441650390625, -9.26513671875, -8.8861083984375, -8.507080078125, -8.1280517578125, -7.7490234375, -7.3699951171875, -6.990966796875, -6.6119384765625, -6.23291015625, -5.8538818359375, -5.474853515625, -5.0958251953125, -4.716796875, -4.3377685546875, -3.958740234375, -3.5797119140625, -3.20068359375, -2.8216552734375, -2.442626953125, -2.0635986328125, -1.6845703125, -1.3055419921875, -0.926513671875, -0.5474853515625, -0.16845703125, 0.2105712890625, 0.589599609375, 0.9686279296875, 1.34765625, 1.7266845703125, 2.105712890625, 2.4847412109375, 2.86376953125, 3.2427978515625, 3.621826171875, 4.0008544921875, 4.3798828125, 4.7589111328125, 5.137939453125, 5.5169677734375, 5.89599609375, 6.2750244140625, 6.654052734375, 7.0330810546875, 7.412109375, 7.7911376953125, 8.170166015625, 8.5491943359375, 8.92822265625, 9.3072509765625, 9.686279296875, 10.0653076171875, 10.4443359375, 10.8233642578125, 11.202392578125, 11.5814208984375, 11.96044921875, 12.3394775390625, 12.718505859375, 13.0975341796875, 13.4765625]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 6.0, 13.0, 22.0, 25.0, 39.0, 62.0, 89.0, 139.0, 243.0, 269.0, 428.0, 691.0, 1003.0, 1454.0, 2269.0, 3409.0, 5156.0, 7910.0, 12275.0, 19321.0, 30183.0, 48509.0, 77044.0, 120369.0, 187091.0, 191843.0, 123560.0, 78273.0, 49288.0, 31043.0, 19817.0, 12621.0, 8215.0, 5449.0, 3404.0, 2350.0, 1565.0, 1011.0, 704.0, 469.0, 307.0, 198.0, 134.0, 91.0, 56.0, 41.0, 32.0, 25.0, 15.0, 2.0, 10.0, 7.0, 3.0, 3.0, 1.0, 1.0], "bins": [-0.270751953125, -0.2625541687011719, -0.25435638427734375, -0.24615859985351562, -0.2379608154296875, -0.22976303100585938, -0.22156524658203125, -0.21336746215820312, -0.205169677734375, -0.19697189331054688, -0.18877410888671875, -0.18057632446289062, -0.1723785400390625, -0.16418075561523438, -0.15598297119140625, -0.14778518676757812, -0.13958740234375, -0.13138961791992188, -0.12319183349609375, -0.11499404907226562, -0.1067962646484375, -0.09859848022460938, -0.09040069580078125, -0.08220291137695312, -0.074005126953125, -0.06580734252929688, -0.05760955810546875, -0.049411773681640625, -0.0412139892578125, -0.033016204833984375, -0.02481842041015625, -0.016620635986328125, -0.0084228515625, -0.000225067138671875, 0.00797271728515625, 0.016170501708984375, 0.0243682861328125, 0.032566070556640625, 0.04076385498046875, 0.048961639404296875, 0.057159423828125, 0.06535720825195312, 0.07355499267578125, 0.08175277709960938, 0.0899505615234375, 0.09814834594726562, 0.10634613037109375, 0.11454391479492188, 0.12274169921875, 0.13093948364257812, 0.13913726806640625, 0.14733505249023438, 0.1555328369140625, 0.16373062133789062, 0.17192840576171875, 0.18012619018554688, 0.188323974609375, 0.19652175903320312, 0.20471954345703125, 0.21291732788085938, 0.2211151123046875, 0.22931289672851562, 0.23751068115234375, 0.24570846557617188, 0.25390625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 6.0, 5.0, 4.0, 6.0, 4.0, 12.0, 15.0, 14.0, 15.0, 27.0, 15.0, 15.0, 20.0, 18.0, 29.0, 27.0, 28.0, 33.0, 26.0, 33.0, 49.0, 35.0, 38.0, 1068.0, 42.0, 35.0, 37.0, 35.0, 39.0, 38.0, 35.0, 19.0, 21.0, 28.0, 26.0, 21.0, 15.0, 15.0, 13.0, 18.0, 10.0, 9.0, 8.0, 5.0, 10.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.9609375, -7.701904296875, -7.44287109375, -7.183837890625, -6.9248046875, -6.665771484375, -6.40673828125, -6.147705078125, -5.888671875, -5.629638671875, -5.37060546875, -5.111572265625, -4.8525390625, -4.593505859375, -4.33447265625, -4.075439453125, -3.81640625, -3.557373046875, -3.29833984375, -3.039306640625, -2.7802734375, -2.521240234375, -2.26220703125, -2.003173828125, -1.744140625, -1.485107421875, -1.22607421875, -0.967041015625, -0.7080078125, -0.448974609375, -0.18994140625, 0.069091796875, 0.328125, 0.587158203125, 0.84619140625, 1.105224609375, 1.3642578125, 1.623291015625, 1.88232421875, 2.141357421875, 2.400390625, 2.659423828125, 2.91845703125, 3.177490234375, 3.4365234375, 3.695556640625, 3.95458984375, 4.213623046875, 4.47265625, 4.731689453125, 4.99072265625, 5.249755859375, 5.5087890625, 5.767822265625, 6.02685546875, 6.285888671875, 6.544921875, 6.803955078125, 7.06298828125, 7.322021484375, 7.5810546875, 7.840087890625, 8.09912109375, 8.358154296875, 8.6171875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 6.0, 7.0, 11.0, 11.0, 19.0, 23.0, 38.0, 57.0, 92.0, 115.0, 174.0, 254.0, 324.0, 432.0, 681.0, 977.0, 1270.0, 1721.0, 2336.0, 3249.0, 4757.0, 6824.0, 9663.0, 13874.0, 20319.0, 29646.0, 44018.0, 67707.0, 106036.0, 172016.0, 1244791.0, 125251.0, 78771.0, 50890.0, 34106.0, 22939.0, 15990.0, 11174.0, 7684.0, 5576.0, 3761.0, 2725.0, 1924.0, 1426.0, 1023.0, 732.0, 494.0, 372.0, 240.0, 200.0, 129.0, 100.0, 58.0, 47.0, 34.0, 26.0, 9.0, 7.0, 5.0, 2.0, 4.0, 3.0, 1.0], "bins": [-0.11517333984375, -0.11147880554199219, -0.10778427124023438, -0.10408973693847656, -0.10039520263671875, -0.09670066833496094, -0.09300613403320312, -0.08931159973144531, -0.0856170654296875, -0.08192253112792969, -0.07822799682617188, -0.07453346252441406, -0.07083892822265625, -0.06714439392089844, -0.06344985961914062, -0.05975532531738281, -0.056060791015625, -0.05236625671386719, -0.048671722412109375, -0.04497718811035156, -0.04128265380859375, -0.03758811950683594, -0.033893585205078125, -0.030199050903320312, -0.0265045166015625, -0.022809982299804688, -0.019115447998046875, -0.015420913696289062, -0.01172637939453125, -0.008031845092773438, -0.004337310791015625, -0.0006427764892578125, 0.0030517578125, 0.0067462921142578125, 0.010440826416015625, 0.014135360717773438, 0.01782989501953125, 0.021524429321289062, 0.025218963623046875, 0.028913497924804688, 0.0326080322265625, 0.03630256652832031, 0.039997100830078125, 0.04369163513183594, 0.04738616943359375, 0.05108070373535156, 0.054775238037109375, 0.05846977233886719, 0.062164306640625, 0.06585884094238281, 0.06955337524414062, 0.07324790954589844, 0.07694244384765625, 0.08063697814941406, 0.08433151245117188, 0.08802604675292969, 0.0917205810546875, 0.09541511535644531, 0.09910964965820312, 0.10280418395996094, 0.10649871826171875, 0.11019325256347656, 0.11388778686523438, 0.11758232116699219, 0.12127685546875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 2.0, 1.0, 5.0, 3.0, 5.0, 5.0, 7.0, 8.0, 7.0, 11.0, 12.0, 12.0, 15.0, 29.0, 32.0, 28.0, 39.0, 41.0, 46.0, 56.0, 61.0, 62.0, 53.0, 67.0, 65.0, 59.0, 40.0, 44.0, 24.0, 28.0, 21.0, 18.0, 15.0, 11.0, 4.0, 9.0, 17.0, 3.0, 7.0, 1.0, 7.0, 2.0, 6.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.0006089210510253906, -0.0005890354514122009, -0.0005691498517990112, -0.0005492642521858215, -0.0005293786525726318, -0.0005094930529594421, -0.0004896074533462524, -0.00046972185373306274, -0.00044983625411987305, -0.00042995065450668335, -0.00041006505489349365, -0.00039017945528030396, -0.00037029385566711426, -0.00035040825605392456, -0.00033052265644073486, -0.00031063705682754517, -0.00029075145721435547, -0.00027086585760116577, -0.0002509802579879761, -0.00023109465837478638, -0.00021120905876159668, -0.00019132345914840698, -0.00017143785953521729, -0.0001515522599220276, -0.0001316666603088379, -0.0001117810606956482, -9.18954610824585e-05, -7.20098614692688e-05, -5.21242618560791e-05, -3.2238662242889404e-05, -1.2353062629699707e-05, 7.53253698348999e-06, 2.7418136596679688e-05, 4.7303736209869385e-05, 6.718933582305908e-05, 8.707493543624878e-05, 0.00010696053504943848, 0.00012684613466262817, 0.00014673173427581787, 0.00016661733388900757, 0.00018650293350219727, 0.00020638853311538696, 0.00022627413272857666, 0.00024615973234176636, 0.00026604533195495605, 0.00028593093156814575, 0.00030581653118133545, 0.00032570213079452515, 0.00034558773040771484, 0.00036547333002090454, 0.00038535892963409424, 0.00040524452924728394, 0.00042513012886047363, 0.00044501572847366333, 0.00046490132808685303, 0.0004847869277000427, 0.0005046725273132324, 0.0005245581269264221, 0.0005444437265396118, 0.0005643293261528015, 0.0005842149257659912, 0.0006041005253791809, 0.0006239861249923706, 0.0006438717246055603, 0.00066375732421875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 4.0, 2.0, 7.0, 2.0, 4.0, 3.0, 19.0, 9.0, 4.0, 11.0, 14.0, 19.0, 26.0, 29.0, 36.0, 56.0, 69.0, 125.0, 234.0, 660.0, 17312.0, 1021426.0, 7418.0, 494.0, 185.0, 93.0, 58.0, 43.0, 46.0, 34.0, 18.0, 11.0, 11.0, 12.0, 8.0, 10.0, 6.0, 4.0, 4.0, 5.0, 4.0, 2.0, 1.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0], "bins": [-0.015869140625, -0.015394210815429688, -0.014919281005859375, -0.014444351196289062, -0.01396942138671875, -0.013494491577148438, -0.013019561767578125, -0.012544631958007812, -0.0120697021484375, -0.011594772338867188, -0.011119842529296875, -0.010644912719726562, -0.01016998291015625, -0.009695053100585938, -0.009220123291015625, -0.008745193481445312, -0.008270263671875, -0.0077953338623046875, -0.007320404052734375, -0.0068454742431640625, -0.00637054443359375, -0.0058956146240234375, -0.005420684814453125, -0.0049457550048828125, -0.0044708251953125, -0.0039958953857421875, -0.003520965576171875, -0.0030460357666015625, -0.00257110595703125, -0.0020961761474609375, -0.001621246337890625, -0.0011463165283203125, -0.00067138671875, -0.0001964569091796875, 0.000278472900390625, 0.0007534027099609375, 0.00122833251953125, 0.0017032623291015625, 0.002178192138671875, 0.0026531219482421875, 0.0031280517578125, 0.0036029815673828125, 0.004077911376953125, 0.0045528411865234375, 0.00502777099609375, 0.0055027008056640625, 0.005977630615234375, 0.0064525604248046875, 0.006927490234375, 0.0074024200439453125, 0.007877349853515625, 0.008352279663085938, 0.00882720947265625, 0.009302139282226562, 0.009777069091796875, 0.010251998901367188, 0.0107269287109375, 0.011201858520507812, 0.011676788330078125, 0.012151718139648438, 0.01262664794921875, 0.013101577758789062, 0.013576507568359375, 0.014051437377929688, 0.0145263671875]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 31.0, 982.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.026336494833230972, -0.025868872180581093, -0.025401249527931213, -0.024933626875281334, -0.024466004222631454, -0.023998383432626724, -0.023530758917331696, -0.023063138127326965, -0.022595515474677086, -0.022127892822027206, -0.021660270169377327, -0.021192647516727448, -0.020725024864077568, -0.02025740221142769, -0.01978978142142296, -0.01932215876877308, -0.0188545361161232, -0.01838691346347332, -0.01791929081082344, -0.01745166815817356, -0.01698404550552368, -0.01651642471551895, -0.016048800200223923, -0.015581178478896618, -0.015113554894924164, -0.014645932242274284, -0.014178309589624405, -0.013710686936974525, -0.01324306521564722, -0.012775442562997341, -0.012307819910347462, -0.011840197257697582, -0.011372575536370277, -0.010904952883720398, -0.010437330231070518, -0.009969707578420639, -0.009502085857093334, -0.009034463204443455, -0.008566840551793575, -0.008099217899143696, -0.007631596177816391, -0.0071639735251665115, -0.006696351338177919, -0.00622872868552804, -0.005761106498539448, -0.005293483845889568, -0.004825861193239689, -0.004358238540589809, -0.0038906161207705736, -0.003422993700951338, -0.0029553710483014584, -0.0024877486284822226, -0.0020201262086629868, -0.001552503788843751, -0.0010848811361938715, -0.0006172587163746357, -0.0001496362965553999, 0.0003179861814714968, 0.0007856086594983935, 0.0012532311957329512, 0.001720853615552187, 0.0021884760353714228, 0.0026560986880213022, 0.003123721107840538, 0.003591343527659774]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 5.0, 10.0, 11.0, 18.0, 15.0, 23.0, 34.0, 52.0, 49.0, 55.0, 49.0, 71.0, 72.0, 79.0, 77.0, 70.0, 58.0, 49.0, 39.0, 45.0, 35.0, 24.0, 18.0, 16.0, 9.0, 4.0, 5.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008350610733032227, -0.0008047772571444511, -0.0007744934409856796, -0.0007442096248269081, -0.0007139258086681366, -0.0006836419925093651, -0.0006533581763505936, -0.000623074360191822, -0.0005927905440330505, -0.000562506727874279, -0.0005322229117155075, -0.000501939095556736, -0.0004716552793979645, -0.00044137146323919296, -0.00041108764708042145, -0.00038080383092164993, -0.0003505200147628784, -0.0003202361986041069, -0.0002899523824453354, -0.0002596685662865639, -0.00022938475012779236, -0.00019910093396902084, -0.00016881711781024933, -0.00013853330165147781, -0.0001082494854927063, -7.796566933393478e-05, -4.768185317516327e-05, -1.7398037016391754e-05, 1.288577914237976e-05, 4.3169595301151276e-05, 7.345341145992279e-05, 0.0001037372276186943, 0.00013402104377746582, 0.00016430485993623734, 0.00019458867609500885, 0.00022487249225378036, 0.0002551563084125519, 0.0002854401245713234, 0.0003157239407300949, 0.0003460077568888664, 0.00037629157304763794, 0.00040657538920640945, 0.00043685920536518097, 0.0004671430215239525, 0.000497426837682724, 0.0005277106538414955, 0.000557994470000267, 0.0005882782861590385, 0.0006185621023178101, 0.0006488459184765816, 0.0006791297346353531, 0.0007094135507941246, 0.0007396973669528961, 0.0007699811831116676, 0.0008002649992704391, 0.0008305488154292107, 0.0008608326315879822, 0.0008911164477467537, 0.0009214002639055252, 0.0009516840800642967, 0.0009819678962230682, 0.0010122517123818398, 0.0010425355285406113, 0.0010728193446993828, 0.0011031031608581543]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 1.0, 6.0, 6.0, 3.0, 9.0, 13.0, 12.0, 21.0, 19.0, 21.0, 25.0, 27.0, 25.0, 39.0, 28.0, 35.0, 41.0, 27.0, 26.0, 38.0, 48.0, 45.0, 52.0, 49.0, 38.0, 41.0, 34.0, 35.0, 36.0, 19.0, 29.0, 23.0, 16.0, 23.0, 11.0, 19.0, 18.0, 8.0, 8.0, 8.0, 4.0, 4.0, 1.0, 4.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.78125, -10.4022216796875, -10.023193359375, -9.6441650390625, -9.26513671875, -8.8861083984375, -8.507080078125, -8.1280517578125, -7.7490234375, -7.3699951171875, -6.990966796875, -6.6119384765625, -6.23291015625, -5.8538818359375, -5.474853515625, -5.0958251953125, -4.716796875, -4.3377685546875, -3.958740234375, -3.5797119140625, -3.20068359375, -2.8216552734375, -2.442626953125, -2.0635986328125, -1.6845703125, -1.3055419921875, -0.926513671875, -0.5474853515625, -0.16845703125, 0.2105712890625, 0.589599609375, 0.9686279296875, 1.34765625, 1.7266845703125, 2.105712890625, 2.4847412109375, 2.86376953125, 3.2427978515625, 3.621826171875, 4.0008544921875, 4.3798828125, 4.7589111328125, 5.137939453125, 5.5169677734375, 5.89599609375, 6.2750244140625, 6.654052734375, 7.0330810546875, 7.412109375, 7.7911376953125, 8.170166015625, 8.5491943359375, 8.92822265625, 9.3072509765625, 9.686279296875, 10.0653076171875, 10.4443359375, 10.8233642578125, 11.202392578125, 11.5814208984375, 11.96044921875, 12.3394775390625, 12.718505859375, 13.0975341796875, 13.4765625]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 4.0, 9.0, 5.0, 12.0, 14.0, 19.0, 23.0, 44.0, 65.0, 88.0, 115.0, 177.0, 276.0, 396.0, 575.0, 926.0, 1383.0, 2385.0, 4006.0, 7459.0, 15303.0, 41789.0, 288605.0, 585906.0, 59489.0, 18574.0, 8836.0, 4786.0, 2726.0, 1656.0, 983.0, 597.0, 409.0, 269.0, 198.0, 131.0, 113.0, 62.0, 32.0, 39.0, 28.0, 14.0, 10.0, 6.0, 3.0, 10.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.1953125, -13.7078857421875, -13.220458984375, -12.7330322265625, -12.24560546875, -11.7581787109375, -11.270751953125, -10.7833251953125, -10.2958984375, -9.8084716796875, -9.321044921875, -8.8336181640625, -8.34619140625, -7.8587646484375, -7.371337890625, -6.8839111328125, -6.396484375, -5.9090576171875, -5.421630859375, -4.9342041015625, -4.44677734375, -3.9593505859375, -3.471923828125, -2.9844970703125, -2.4970703125, -2.0096435546875, -1.522216796875, -1.0347900390625, -0.54736328125, -0.0599365234375, 0.427490234375, 0.9149169921875, 1.40234375, 1.8897705078125, 2.377197265625, 2.8646240234375, 3.35205078125, 3.8394775390625, 4.326904296875, 4.8143310546875, 5.3017578125, 5.7891845703125, 6.276611328125, 6.7640380859375, 7.25146484375, 7.7388916015625, 8.226318359375, 8.7137451171875, 9.201171875, 9.6885986328125, 10.176025390625, 10.6634521484375, 11.15087890625, 11.6383056640625, 12.125732421875, 12.6131591796875, 13.1005859375, 13.5880126953125, 14.075439453125, 14.5628662109375, 15.05029296875, 15.5377197265625, 16.025146484375, 16.5125732421875, 17.0]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 5.0, 9.0, 10.0, 8.0, 11.0, 15.0, 22.0, 19.0, 18.0, 29.0, 37.0, 33.0, 30.0, 39.0, 45.0, 54.0, 82.0, 171.0, 1812.0, 114.0, 86.0, 55.0, 44.0, 41.0, 41.0, 31.0, 40.0, 26.0, 33.0, 17.0, 14.0, 10.0, 10.0, 7.0, 6.0, 4.0, 7.0, 4.0, 2.0, 5.0, 3.0, 0.0, 5.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-40.375, -39.12646484375, -37.8779296875, -36.62939453125, -35.380859375, -34.13232421875, -32.8837890625, -31.63525390625, -30.38671875, -29.13818359375, -27.8896484375, -26.64111328125, -25.392578125, -24.14404296875, -22.8955078125, -21.64697265625, -20.3984375, -19.14990234375, -17.9013671875, -16.65283203125, -15.404296875, -14.15576171875, -12.9072265625, -11.65869140625, -10.41015625, -9.16162109375, -7.9130859375, -6.66455078125, -5.416015625, -4.16748046875, -2.9189453125, -1.67041015625, -0.421875, 0.82666015625, 2.0751953125, 3.32373046875, 4.572265625, 5.82080078125, 7.0693359375, 8.31787109375, 9.56640625, 10.81494140625, 12.0634765625, 13.31201171875, 14.560546875, 15.80908203125, 17.0576171875, 18.30615234375, 19.5546875, 20.80322265625, 22.0517578125, 23.30029296875, 24.548828125, 25.79736328125, 27.0458984375, 28.29443359375, 29.54296875, 30.79150390625, 32.0400390625, 33.28857421875, 34.537109375, 35.78564453125, 37.0341796875, 38.28271484375, 39.53125]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 4.0, 3.0, 1.0, 7.0, 7.0, 5.0, 6.0, 6.0, 13.0, 14.0, 17.0, 27.0, 36.0, 46.0, 48.0, 71.0, 95.0, 136.0, 340.0, 1119.0, 10193.0, 2881240.0, 245333.0, 5405.0, 832.0, 221.0, 128.0, 70.0, 54.0, 51.0, 35.0, 33.0, 26.0, 22.0, 13.0, 11.0, 9.0, 6.0, 13.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-91.125, -88.2666015625, -85.408203125, -82.5498046875, -79.69140625, -76.8330078125, -73.974609375, -71.1162109375, -68.2578125, -65.3994140625, -62.541015625, -59.6826171875, -56.82421875, -53.9658203125, -51.107421875, -48.2490234375, -45.390625, -42.5322265625, -39.673828125, -36.8154296875, -33.95703125, -31.0986328125, -28.240234375, -25.3818359375, -22.5234375, -19.6650390625, -16.806640625, -13.9482421875, -11.08984375, -8.2314453125, -5.373046875, -2.5146484375, 0.34375, 3.2021484375, 6.060546875, 8.9189453125, 11.77734375, 14.6357421875, 17.494140625, 20.3525390625, 23.2109375, 26.0693359375, 28.927734375, 31.7861328125, 34.64453125, 37.5029296875, 40.361328125, 43.2197265625, 46.078125, 48.9365234375, 51.794921875, 54.6533203125, 57.51171875, 60.3701171875, 63.228515625, 66.0869140625, 68.9453125, 71.8037109375, 74.662109375, 77.5205078125, 80.37890625, 83.2373046875, 86.095703125, 88.9541015625, 91.8125]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 16.0, 193.0, 543.0, 232.0, 24.0, 5.0, 0.0, 2.0], "bins": [-378.1009826660156, -371.63995361328125, -365.17889404296875, -358.7178649902344, -352.2568054199219, -345.7957763671875, -339.334716796875, -332.8736877441406, -326.41265869140625, -319.9516296386719, -313.4905700683594, -307.029541015625, -300.5684814453125, -294.1074523925781, -287.64642333984375, -281.18536376953125, -274.72430419921875, -268.2632751464844, -261.8022155761719, -255.3411865234375, -248.88014221191406, -242.41909790039062, -235.9580535888672, -229.49700927734375, -223.03598022460938, -216.57493591308594, -210.1138916015625, -203.65286254882812, -197.1918182373047, -190.73077392578125, -184.2697296142578, -177.80868530273438, -171.34765625, -164.88661193847656, -158.42556762695312, -151.96453857421875, -145.5034942626953, -139.04244995117188, -132.58140563964844, -126.120361328125, -119.65933227539062, -113.19828796386719, -106.73725128173828, -100.27620697021484, -93.81517028808594, -87.3541259765625, -80.89308166503906, -74.43203735351562, -67.97099304199219, -61.509952545166016, -55.048912048339844, -48.587867736816406, -42.126827239990234, -35.66578674316406, -29.204742431640625, -22.743701934814453, -16.282665252685547, -9.821623802185059, -3.3605823516845703, 3.1004600524902344, 9.561500549316406, 16.022541046142578, 22.483585357666016, 28.944625854492188, 35.40566635131836]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 2.0, 3.0, 4.0, 5.0, 11.0, 11.0, 7.0, 19.0, 15.0, 14.0, 22.0, 25.0, 24.0, 27.0, 26.0, 25.0, 32.0, 29.0, 38.0, 34.0, 39.0, 33.0, 40.0, 45.0, 38.0, 45.0, 38.0, 32.0, 26.0, 29.0, 25.0, 24.0, 24.0, 18.0, 23.0, 22.0, 16.0, 24.0, 16.0, 8.0, 15.0, 8.0, 5.0, 4.0, 10.0, 3.0, 6.0, 5.0, 0.0, 1.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-84.20744323730469, -81.36939239501953, -78.53133392333984, -75.69328308105469, -72.855224609375, -70.01717376708984, -67.17912292480469, -64.341064453125, -61.503013610839844, -58.66495895385742, -55.826904296875, -52.988853454589844, -50.15079879760742, -47.312744140625, -44.474693298339844, -41.63663864135742, -38.798583984375, -35.96052932739258, -33.122474670410156, -30.284423828125, -27.446369171142578, -24.608314514160156, -21.770261764526367, -18.932209014892578, -16.094154357910156, -13.25610065460205, -10.418046951293945, -7.57999324798584, -4.741939544677734, -1.903885841369629, 0.9341678619384766, 3.7722206115722656, 6.6102752685546875, 9.448328971862793, 12.286382675170898, 15.124436378479004, 17.96249008178711, 20.80054473876953, 23.63859748840332, 26.47665023803711, 29.31470489501953, 32.15275955200195, 34.990814208984375, 37.82886505126953, 40.66691970825195, 43.504974365234375, 46.34302520751953, 49.18107986450195, 52.019134521484375, 54.8571891784668, 57.69524383544922, 60.533294677734375, 63.3713493347168, 66.20940399169922, 69.04745483398438, 71.88551330566406, 74.72356414794922, 77.56161499023438, 80.39967346191406, 83.23772430419922, 86.07577514648438, 88.91383361816406, 91.75188446044922, 94.58993530273438, 97.42799377441406]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 5.0, 7.0, 8.0, 7.0, 13.0, 15.0, 18.0, 22.0, 23.0, 22.0, 27.0, 27.0, 37.0, 30.0, 31.0, 33.0, 31.0, 34.0, 40.0, 34.0, 48.0, 44.0, 47.0, 39.0, 31.0, 46.0, 38.0, 32.0, 23.0, 25.0, 19.0, 20.0, 20.0, 18.0, 13.0, 13.0, 7.0, 11.0, 12.0, 8.0, 4.0, 3.0, 2.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-11.6953125, -11.310546875, -10.92578125, -10.541015625, -10.15625, -9.771484375, -9.38671875, -9.001953125, -8.6171875, -8.232421875, -7.84765625, -7.462890625, -7.078125, -6.693359375, -6.30859375, -5.923828125, -5.5390625, -5.154296875, -4.76953125, -4.384765625, -4.0, -3.615234375, -3.23046875, -2.845703125, -2.4609375, -2.076171875, -1.69140625, -1.306640625, -0.921875, -0.537109375, -0.15234375, 0.232421875, 0.6171875, 1.001953125, 1.38671875, 1.771484375, 2.15625, 2.541015625, 2.92578125, 3.310546875, 3.6953125, 4.080078125, 4.46484375, 4.849609375, 5.234375, 5.619140625, 6.00390625, 6.388671875, 6.7734375, 7.158203125, 7.54296875, 7.927734375, 8.3125, 8.697265625, 9.08203125, 9.466796875, 9.8515625, 10.236328125, 10.62109375, 11.005859375, 11.390625, 11.775390625, 12.16015625, 12.544921875, 12.9296875]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 8.0, 14.0, 24.0, 26.0, 42.0, 50.0, 81.0, 123.0, 172.0, 232.0, 317.0, 463.0, 723.0, 1092.0, 1612.0, 2520.0, 3823.0, 6411.0, 10861.0, 20646.0, 49804.0, 157302.0, 576315.0, 1623025.0, 1191677.0, 378867.0, 97068.0, 32230.0, 15359.0, 8634.0, 5103.0, 3222.0, 2047.0, 1459.0, 915.0, 545.0, 407.0, 309.0, 211.0, 152.0, 122.0, 79.0, 56.0, 30.0, 26.0, 19.0, 18.0, 13.0, 9.0, 8.0, 6.0, 2.0, 6.0, 0.0, 3.0, 1.0], "bins": [-14.421875, -13.9686279296875, -13.515380859375, -13.0621337890625, -12.60888671875, -12.1556396484375, -11.702392578125, -11.2491455078125, -10.7958984375, -10.3426513671875, -9.889404296875, -9.4361572265625, -8.98291015625, -8.5296630859375, -8.076416015625, -7.6231689453125, -7.169921875, -6.7166748046875, -6.263427734375, -5.8101806640625, -5.35693359375, -4.9036865234375, -4.450439453125, -3.9971923828125, -3.5439453125, -3.0906982421875, -2.637451171875, -2.1842041015625, -1.73095703125, -1.2777099609375, -0.824462890625, -0.3712158203125, 0.08203125, 0.5352783203125, 0.988525390625, 1.4417724609375, 1.89501953125, 2.3482666015625, 2.801513671875, 3.2547607421875, 3.7080078125, 4.1612548828125, 4.614501953125, 5.0677490234375, 5.52099609375, 5.9742431640625, 6.427490234375, 6.8807373046875, 7.333984375, 7.7872314453125, 8.240478515625, 8.6937255859375, 9.14697265625, 9.6002197265625, 10.053466796875, 10.5067138671875, 10.9599609375, 11.4132080078125, 11.866455078125, 12.3197021484375, 12.77294921875, 13.2261962890625, 13.679443359375, 14.1326904296875, 14.5859375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 4.0, 3.0, 5.0, 10.0, 9.0, 13.0, 22.0, 34.0, 35.0, 52.0, 64.0, 81.0, 154.0, 226.0, 411.0, 695.0, 823.0, 589.0, 311.0, 167.0, 104.0, 63.0, 57.0, 34.0, 23.0, 20.0, 20.0, 17.0, 10.0, 11.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-35.96875, -35.07568359375, -34.1826171875, -33.28955078125, -32.396484375, -31.50341796875, -30.6103515625, -29.71728515625, -28.82421875, -27.93115234375, -27.0380859375, -26.14501953125, -25.251953125, -24.35888671875, -23.4658203125, -22.57275390625, -21.6796875, -20.78662109375, -19.8935546875, -19.00048828125, -18.107421875, -17.21435546875, -16.3212890625, -15.42822265625, -14.53515625, -13.64208984375, -12.7490234375, -11.85595703125, -10.962890625, -10.06982421875, -9.1767578125, -8.28369140625, -7.390625, -6.49755859375, -5.6044921875, -4.71142578125, -3.818359375, -2.92529296875, -2.0322265625, -1.13916015625, -0.24609375, 0.64697265625, 1.5400390625, 2.43310546875, 3.326171875, 4.21923828125, 5.1123046875, 6.00537109375, 6.8984375, 7.79150390625, 8.6845703125, 9.57763671875, 10.470703125, 11.36376953125, 12.2568359375, 13.14990234375, 14.04296875, 14.93603515625, 15.8291015625, 16.72216796875, 17.615234375, 18.50830078125, 19.4013671875, 20.29443359375, 21.1875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 5.0, 7.0, 13.0, 19.0, 15.0, 23.0, 32.0, 29.0, 63.0, 97.0, 219.0, 536.0, 3075.0, 75594.0, 4028231.0, 82041.0, 3088.0, 594.0, 230.0, 106.0, 80.0, 48.0, 32.0, 35.0, 17.0, 12.0, 15.0, 4.0, 6.0, 4.0, 3.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.4375, -83.8701171875, -80.302734375, -76.7353515625, -73.16796875, -69.6005859375, -66.033203125, -62.4658203125, -58.8984375, -55.3310546875, -51.763671875, -48.1962890625, -44.62890625, -41.0615234375, -37.494140625, -33.9267578125, -30.359375, -26.7919921875, -23.224609375, -19.6572265625, -16.08984375, -12.5224609375, -8.955078125, -5.3876953125, -1.8203125, 1.7470703125, 5.314453125, 8.8818359375, 12.44921875, 16.0166015625, 19.583984375, 23.1513671875, 26.71875, 30.2861328125, 33.853515625, 37.4208984375, 40.98828125, 44.5556640625, 48.123046875, 51.6904296875, 55.2578125, 58.8251953125, 62.392578125, 65.9599609375, 69.52734375, 73.0947265625, 76.662109375, 80.2294921875, 83.796875, 87.3642578125, 90.931640625, 94.4990234375, 98.06640625, 101.6337890625, 105.201171875, 108.7685546875, 112.3359375, 115.9033203125, 119.470703125, 123.0380859375, 126.60546875, 130.1728515625, 133.740234375, 137.3076171875, 140.875]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 21.0, 43.0, 104.0, 225.0, 298.0, 188.0, 87.0, 32.0, 12.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0], "bins": [-356.9347229003906, -350.2441101074219, -343.5534973144531, -336.8628845214844, -330.1722717285156, -323.48162841796875, -316.791015625, -310.10040283203125, -303.4097900390625, -296.71917724609375, -290.028564453125, -283.33795166015625, -276.6473388671875, -269.95672607421875, -263.2660827636719, -256.5754699707031, -249.88485717773438, -243.19424438476562, -236.50363159179688, -229.81300354003906, -223.1223907470703, -216.43177795410156, -209.7411651611328, -203.050537109375, -196.3599395751953, -189.66932678222656, -182.9787139892578, -176.2880859375, -169.59747314453125, -162.9068603515625, -156.21624755859375, -149.525634765625, -142.8350067138672, -136.14439392089844, -129.4537811279297, -122.7631607055664, -116.07254028320312, -109.38192749023438, -102.69131469726562, -96.00069427490234, -89.31007385253906, -82.61946105957031, -75.92884063720703, -69.23822784423828, -62.547607421875, -55.85699462890625, -49.166378021240234, -42.47576141357422, -35.78514862060547, -29.094532012939453, -22.403915405273438, -15.713300704956055, -9.022684097290039, -2.3320693969726562, 4.358547210693359, 11.049163818359375, 17.73978042602539, 24.430397033691406, 31.121013641357422, 37.81163024902344, 44.50224304199219, 51.1928596496582, 57.88347625732422, 64.5740966796875, 71.26470947265625]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 1.0, 5.0, 11.0, 5.0, 11.0, 8.0, 9.0, 14.0, 8.0, 14.0, 12.0, 14.0, 17.0, 15.0, 24.0, 22.0, 24.0, 30.0, 30.0, 38.0, 25.0, 39.0, 39.0, 46.0, 25.0, 45.0, 43.0, 23.0, 39.0, 31.0, 29.0, 31.0, 34.0, 27.0, 33.0, 14.0, 31.0, 16.0, 11.0, 26.0, 10.0, 12.0, 12.0, 14.0, 7.0, 10.0, 6.0, 6.0, 3.0, 1.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-61.083892822265625, -59.129764556884766, -57.175636291503906, -55.22150802612305, -53.26737976074219, -51.313255310058594, -49.359127044677734, -47.404998779296875, -45.450870513916016, -43.496742248535156, -41.5426139831543, -39.58848571777344, -37.634361267089844, -35.68022918701172, -33.726104736328125, -31.771976470947266, -29.817848205566406, -27.863719940185547, -25.909591674804688, -23.95546531677246, -22.0013370513916, -20.047208786010742, -18.093082427978516, -16.138954162597656, -14.184825897216797, -12.230697631835938, -10.276570320129395, -8.322443008422852, -6.368314743041992, -4.414186477661133, -2.46005916595459, -0.5059318542480469, 1.4481964111328125, 3.4023241996765137, 5.356451988220215, 7.310579776763916, 9.264707565307617, 11.218835830688477, 13.17296314239502, 15.127090454101562, 17.081218719482422, 19.03534698486328, 20.98947525024414, 22.943601608276367, 24.897729873657227, 26.851858139038086, 28.805984497070312, 30.760112762451172, 32.71424102783203, 34.66836929321289, 36.62249755859375, 38.57662582397461, 40.53075408935547, 42.48487854003906, 44.43900680541992, 46.39313507080078, 48.34726333618164, 50.3013916015625, 52.25551986694336, 54.20964813232422, 56.16377258300781, 58.11790466308594, 60.07202911376953, 62.02615737915039, 63.98028564453125]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 1.0, 4.0, 3.0, 8.0, 12.0, 9.0, 17.0, 14.0, 14.0, 22.0, 25.0, 27.0, 20.0, 30.0, 31.0, 34.0, 29.0, 38.0, 39.0, 45.0, 35.0, 22.0, 34.0, 45.0, 42.0, 41.0, 32.0, 44.0, 34.0, 41.0, 26.0, 21.0, 25.0, 19.0, 20.0, 16.0, 22.0, 15.0, 8.0, 6.0, 5.0, 7.0, 2.0, 5.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.171875, -10.8018798828125, -10.431884765625, -10.0618896484375, -9.69189453125, -9.3218994140625, -8.951904296875, -8.5819091796875, -8.2119140625, -7.8419189453125, -7.471923828125, -7.1019287109375, -6.73193359375, -6.3619384765625, -5.991943359375, -5.6219482421875, -5.251953125, -4.8819580078125, -4.511962890625, -4.1419677734375, -3.77197265625, -3.4019775390625, -3.031982421875, -2.6619873046875, -2.2919921875, -1.9219970703125, -1.552001953125, -1.1820068359375, -0.81201171875, -0.4420166015625, -0.072021484375, 0.2979736328125, 0.66796875, 1.0379638671875, 1.407958984375, 1.7779541015625, 2.14794921875, 2.5179443359375, 2.887939453125, 3.2579345703125, 3.6279296875, 3.9979248046875, 4.367919921875, 4.7379150390625, 5.10791015625, 5.4779052734375, 5.847900390625, 6.2178955078125, 6.587890625, 6.9578857421875, 7.327880859375, 7.6978759765625, 8.06787109375, 8.4378662109375, 8.807861328125, 9.1778564453125, 9.5478515625, 9.9178466796875, 10.287841796875, 10.6578369140625, 11.02783203125, 11.3978271484375, 11.767822265625, 12.1378173828125, 12.5078125]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 9.0, 12.0, 20.0, 34.0, 33.0, 58.0, 89.0, 116.0, 192.0, 279.0, 402.0, 584.0, 900.0, 1293.0, 1802.0, 2693.0, 4068.0, 6039.0, 9374.0, 14132.0, 21761.0, 34075.0, 52989.0, 82495.0, 129726.0, 193510.0, 175237.0, 113171.0, 71329.0, 46019.0, 29680.0, 19181.0, 12604.0, 8176.0, 5424.0, 3586.0, 2434.0, 1577.0, 1099.0, 730.0, 488.0, 339.0, 252.0, 172.0, 122.0, 60.0, 56.0, 47.0, 31.0, 24.0, 12.0, 5.0, 9.0, 5.0, 5.0, 1.0, 1.0, 2.0], "bins": [-0.251953125, -0.24404144287109375, -0.2361297607421875, -0.22821807861328125, -0.220306396484375, -0.21239471435546875, -0.2044830322265625, -0.19657135009765625, -0.18865966796875, -0.18074798583984375, -0.1728363037109375, -0.16492462158203125, -0.157012939453125, -0.14910125732421875, -0.1411895751953125, -0.13327789306640625, -0.1253662109375, -0.11745452880859375, -0.1095428466796875, -0.10163116455078125, -0.093719482421875, -0.08580780029296875, -0.0778961181640625, -0.06998443603515625, -0.06207275390625, -0.05416107177734375, -0.0462493896484375, -0.03833770751953125, -0.030426025390625, -0.02251434326171875, -0.0146026611328125, -0.00669097900390625, 0.001220703125, 0.00913238525390625, 0.0170440673828125, 0.02495574951171875, 0.032867431640625, 0.04077911376953125, 0.0486907958984375, 0.05660247802734375, 0.06451416015625, 0.07242584228515625, 0.0803375244140625, 0.08824920654296875, 0.096160888671875, 0.10407257080078125, 0.1119842529296875, 0.11989593505859375, 0.1278076171875, 0.13571929931640625, 0.1436309814453125, 0.15154266357421875, 0.159454345703125, 0.16736602783203125, 0.1752777099609375, 0.18318939208984375, 0.19110107421875, 0.19901275634765625, 0.2069244384765625, 0.21483612060546875, 0.222747802734375, 0.23065948486328125, 0.2385711669921875, 0.24648284912109375, 0.25439453125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 4.0, 2.0, 3.0, 7.0, 6.0, 16.0, 10.0, 12.0, 18.0, 15.0, 14.0, 19.0, 27.0, 28.0, 28.0, 36.0, 36.0, 42.0, 28.0, 35.0, 26.0, 33.0, 34.0, 1055.0, 34.0, 32.0, 36.0, 30.0, 36.0, 30.0, 32.0, 28.0, 33.0, 24.0, 25.0, 27.0, 20.0, 29.0, 12.0, 11.0, 11.0, 13.0, 6.0, 3.0, 8.0, 3.0, 2.0, 3.0, 0.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.9921875, -7.7354736328125, -7.478759765625, -7.2220458984375, -6.96533203125, -6.7086181640625, -6.451904296875, -6.1951904296875, -5.9384765625, -5.6817626953125, -5.425048828125, -5.1683349609375, -4.91162109375, -4.6549072265625, -4.398193359375, -4.1414794921875, -3.884765625, -3.6280517578125, -3.371337890625, -3.1146240234375, -2.85791015625, -2.6011962890625, -2.344482421875, -2.0877685546875, -1.8310546875, -1.5743408203125, -1.317626953125, -1.0609130859375, -0.80419921875, -0.5474853515625, -0.290771484375, -0.0340576171875, 0.22265625, 0.4793701171875, 0.736083984375, 0.9927978515625, 1.24951171875, 1.5062255859375, 1.762939453125, 2.0196533203125, 2.2763671875, 2.5330810546875, 2.789794921875, 3.0465087890625, 3.30322265625, 3.5599365234375, 3.816650390625, 4.0733642578125, 4.330078125, 4.5867919921875, 4.843505859375, 5.1002197265625, 5.35693359375, 5.6136474609375, 5.870361328125, 6.1270751953125, 6.3837890625, 6.6405029296875, 6.897216796875, 7.1539306640625, 7.41064453125, 7.6673583984375, 7.924072265625, 8.1807861328125, 8.4375]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 5.0, 3.0, 12.0, 12.0, 6.0, 29.0, 34.0, 55.0, 80.0, 92.0, 156.0, 206.0, 291.0, 398.0, 560.0, 764.0, 1138.0, 1611.0, 2183.0, 3201.0, 4589.0, 6509.0, 9522.0, 13725.0, 20087.0, 29447.0, 43131.0, 63589.0, 95331.0, 146462.0, 1235461.0, 138184.0, 90271.0, 60205.0, 40844.0, 27498.0, 18589.0, 12976.0, 8881.0, 6344.0, 4426.0, 2934.0, 2012.0, 1527.0, 1145.0, 754.0, 563.0, 392.0, 275.0, 184.0, 128.0, 101.0, 74.0, 57.0, 30.0, 24.0, 18.0, 11.0, 3.0, 3.0, 3.0, 1.0, 4.0], "bins": [-0.11627197265625, -0.11257266998291016, -0.10887336730957031, -0.10517406463623047, -0.10147476196289062, -0.09777545928955078, -0.09407615661621094, -0.0903768539428711, -0.08667755126953125, -0.0829782485961914, -0.07927894592285156, -0.07557964324951172, -0.07188034057617188, -0.06818103790283203, -0.06448173522949219, -0.060782432556152344, -0.0570831298828125, -0.053383827209472656, -0.04968452453613281, -0.04598522186279297, -0.042285919189453125, -0.03858661651611328, -0.03488731384277344, -0.031188011169433594, -0.02748870849609375, -0.023789405822753906, -0.020090103149414062, -0.01639080047607422, -0.012691497802734375, -0.008992195129394531, -0.0052928924560546875, -0.0015935897827148438, 0.002105712890625, 0.005805015563964844, 0.009504318237304688, 0.013203620910644531, 0.016902923583984375, 0.02060222625732422, 0.024301528930664062, 0.028000831604003906, 0.03170013427734375, 0.035399436950683594, 0.03909873962402344, 0.04279804229736328, 0.046497344970703125, 0.05019664764404297, 0.05389595031738281, 0.057595252990722656, 0.0612945556640625, 0.06499385833740234, 0.06869316101074219, 0.07239246368408203, 0.07609176635742188, 0.07979106903076172, 0.08349037170410156, 0.0871896743774414, 0.09088897705078125, 0.0945882797241211, 0.09828758239746094, 0.10198688507080078, 0.10568618774414062, 0.10938549041748047, 0.11308479309082031, 0.11678409576416016, 0.1204833984375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 4.0, 2.0, 1.0, 9.0, 7.0, 10.0, 11.0, 14.0, 13.0, 17.0, 23.0, 33.0, 42.0, 36.0, 66.0, 42.0, 61.0, 47.0, 85.0, 61.0, 56.0, 56.0, 42.0, 48.0, 37.0, 36.0, 27.0, 21.0, 16.0, 14.0, 11.0, 5.0, 9.0, 6.0, 5.0, 8.0, 4.0, 3.0, 1.0, 3.0, 3.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0006504058837890625, -0.0006269589066505432, -0.0006035119295120239, -0.0005800649523735046, -0.0005566179752349854, -0.0005331709980964661, -0.0005097240209579468, -0.0004862770438194275, -0.0004628300666809082, -0.0004393830895423889, -0.00041593611240386963, -0.00039248913526535034, -0.00036904215812683105, -0.00034559518098831177, -0.0003221482038497925, -0.0002987012267112732, -0.0002752542495727539, -0.0002518072724342346, -0.00022836029529571533, -0.00020491331815719604, -0.00018146634101867676, -0.00015801936388015747, -0.00013457238674163818, -0.0001111254096031189, -8.767843246459961e-05, -6.423145532608032e-05, -4.0784478187561035e-05, -1.7337501049041748e-05, 6.109476089477539e-06, 2.9556453227996826e-05, 5.300343036651611e-05, 7.64504075050354e-05, 9.989738464355469e-05, 0.00012334436178207397, 0.00014679133892059326, 0.00017023831605911255, 0.00019368529319763184, 0.00021713227033615112, 0.0002405792474746704, 0.0002640262246131897, 0.000287473201751709, 0.00031092017889022827, 0.00033436715602874756, 0.00035781413316726685, 0.00038126111030578613, 0.0004047080874443054, 0.0004281550645828247, 0.000451602041721344, 0.0004750490188598633, 0.0004984959959983826, 0.0005219429731369019, 0.0005453899502754211, 0.0005688369274139404, 0.0005922839045524597, 0.000615730881690979, 0.0006391778588294983, 0.0006626248359680176, 0.0006860718131065369, 0.0007095187902450562, 0.0007329657673835754, 0.0007564127445220947, 0.000779859721660614, 0.0008033066987991333, 0.0008267536759376526, 0.0008502006530761719]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 2.0, 2.0, 3.0, 4.0, 3.0, 7.0, 5.0, 7.0, 7.0, 7.0, 8.0, 17.0, 17.0, 22.0, 31.0, 49.0, 40.0, 91.0, 91.0, 217.0, 580.0, 17410.0, 1026642.0, 2394.0, 377.0, 144.0, 115.0, 46.0, 56.0, 39.0, 26.0, 16.0, 16.0, 11.0, 13.0, 11.0, 6.0, 7.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.02056884765625, -0.020002365112304688, -0.019435882568359375, -0.018869400024414062, -0.01830291748046875, -0.017736434936523438, -0.017169952392578125, -0.016603469848632812, -0.0160369873046875, -0.015470504760742188, -0.014904022216796875, -0.014337539672851562, -0.01377105712890625, -0.013204574584960938, -0.012638092041015625, -0.012071609497070312, -0.011505126953125, -0.010938644409179688, -0.010372161865234375, -0.009805679321289062, -0.00923919677734375, -0.008672714233398438, -0.008106231689453125, -0.0075397491455078125, -0.0069732666015625, -0.0064067840576171875, -0.005840301513671875, -0.0052738189697265625, -0.00470733642578125, -0.0041408538818359375, -0.003574371337890625, -0.0030078887939453125, -0.00244140625, -0.0018749237060546875, -0.001308441162109375, -0.0007419586181640625, -0.00017547607421875, 0.0003910064697265625, 0.000957489013671875, 0.0015239715576171875, 0.0020904541015625, 0.0026569366455078125, 0.003223419189453125, 0.0037899017333984375, 0.00435638427734375, 0.0049228668212890625, 0.005489349365234375, 0.0060558319091796875, 0.006622314453125, 0.0071887969970703125, 0.007755279541015625, 0.008321762084960938, 0.00888824462890625, 0.009454727172851562, 0.010021209716796875, 0.010587692260742188, 0.0111541748046875, 0.011720657348632812, 0.012287139892578125, 0.012853622436523438, 0.01342010498046875, 0.013986587524414062, 0.014553070068359375, 0.015119552612304688, 0.01568603515625]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 21.0, 964.0, 27.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.013575304299592972, -0.013312075287103653, -0.013048846274614334, -0.01278561633080244, -0.012522387318313122, -0.012259158305823803, -0.011995929293334484, -0.01173269934952259, -0.011469470337033272, -0.011206241324543953, -0.010943012312054634, -0.01067978236824274, -0.010416553355753422, -0.010153324343264103, -0.009890095330774784, -0.00962686538696289, -0.009363636374473572, -0.009100407361984253, -0.008837178349494934, -0.00857394840568304, -0.008310719393193722, -0.008047490380704403, -0.007784261368215084, -0.007521031890064478, -0.007257803343236446, -0.0069945743307471275, -0.006731344852596521, -0.0064681158401072025, -0.006204886361956596, -0.0059416573494672775, -0.005678428336977959, -0.0054151988588273525, -0.005151968449354172, -0.004888739436864853, -0.004625509958714247, -0.004362280946224928, -0.004099051468074322, -0.003835822455585003, -0.0035725932102650404, -0.003309363964945078, -0.003046134952455759, -0.0027829057071357965, -0.002519676461815834, -0.002256447449326515, -0.001993217971175909, -0.0017299888422712684, -0.0014667597133666277, -0.0012035304680466652, -0.0009403012227267027, -0.0006770719774067402, -0.0004138427902944386, -0.000150613603182137, 0.00011261564213782549, 0.000375844887457788, 0.0006390740163624287, 0.0009023032616823912, 0.0011655325070023537, 0.0014287617523223162, 0.0016919909976422787, 0.0019552200101315975, 0.0022184494882822037, 0.0024816785007715225, 0.002744907746091485, 0.0030081369914114475, 0.00327136623673141]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 11.0, 11.0, 23.0, 25.0, 31.0, 31.0, 56.0, 52.0, 70.0, 73.0, 93.0, 68.0, 83.0, 67.0, 61.0, 46.0, 53.0, 45.0, 33.0, 26.0, 21.0, 5.0, 7.0, 8.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000981152057647705, -0.0009465292096138, -0.000911906361579895, -0.00087728351354599, -0.000842660665512085, -0.0008080378174781799, -0.0007734149694442749, -0.0007387921214103699, -0.0007041692733764648, -0.0006695464253425598, -0.0006349235773086548, -0.0006003007292747498, -0.0005656778812408447, -0.0005310550332069397, -0.0004964321851730347, -0.00046180933713912964, -0.0004271864891052246, -0.0003925636410713196, -0.00035794079303741455, -0.0003233179450035095, -0.0002886950969696045, -0.00025407224893569946, -0.00021944940090179443, -0.0001848265528678894, -0.00015020370483398438, -0.00011558085680007935, -8.095800876617432e-05, -4.633516073226929e-05, -1.1712312698364258e-05, 2.291053533554077e-05, 5.75333833694458e-05, 9.215623140335083e-05, 0.00012677907943725586, 0.0001614019274711609, 0.00019602477550506592, 0.00023064762353897095, 0.000265270471572876, 0.000299893319606781, 0.00033451616764068604, 0.00036913901567459106, 0.0004037618637084961, 0.0004383847117424011, 0.00047300755977630615, 0.0005076304078102112, 0.0005422532558441162, 0.0005768761038780212, 0.0006114989519119263, 0.0006461217999458313, 0.0006807446479797363, 0.0007153674960136414, 0.0007499903440475464, 0.0007846131920814514, 0.0008192360401153564, 0.0008538588881492615, 0.0008884817361831665, 0.0009231045842170715, 0.0009577274322509766, 0.0009923502802848816, 0.0010269731283187866, 0.0010615959763526917, 0.0010962188243865967, 0.0011308416724205017, 0.0011654645204544067, 0.0012000873684883118, 0.0012347102165222168]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 1.0, 4.0, 3.0, 8.0, 12.0, 9.0, 17.0, 14.0, 14.0, 22.0, 25.0, 27.0, 20.0, 30.0, 31.0, 34.0, 29.0, 38.0, 39.0, 45.0, 35.0, 22.0, 34.0, 45.0, 42.0, 41.0, 32.0, 44.0, 34.0, 41.0, 26.0, 21.0, 25.0, 19.0, 20.0, 16.0, 22.0, 15.0, 8.0, 6.0, 5.0, 7.0, 2.0, 5.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.171875, -10.8018798828125, -10.431884765625, -10.0618896484375, -9.69189453125, -9.3218994140625, -8.951904296875, -8.5819091796875, -8.2119140625, -7.8419189453125, -7.471923828125, -7.1019287109375, -6.73193359375, -6.3619384765625, -5.991943359375, -5.6219482421875, -5.251953125, -4.8819580078125, -4.511962890625, -4.1419677734375, -3.77197265625, -3.4019775390625, -3.031982421875, -2.6619873046875, -2.2919921875, -1.9219970703125, -1.552001953125, -1.1820068359375, -0.81201171875, -0.4420166015625, -0.072021484375, 0.2979736328125, 0.66796875, 1.0379638671875, 1.407958984375, 1.7779541015625, 2.14794921875, 2.5179443359375, 2.887939453125, 3.2579345703125, 3.6279296875, 3.9979248046875, 4.367919921875, 4.7379150390625, 5.10791015625, 5.4779052734375, 5.847900390625, 6.2178955078125, 6.587890625, 6.9578857421875, 7.327880859375, 7.6978759765625, 8.06787109375, 8.4378662109375, 8.807861328125, 9.1778564453125, 9.5478515625, 9.9178466796875, 10.287841796875, 10.6578369140625, 11.02783203125, 11.3978271484375, 11.767822265625, 12.1378173828125, 12.5078125]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 5.0, 6.0, 5.0, 10.0, 13.0, 23.0, 27.0, 47.0, 64.0, 76.0, 114.0, 143.0, 217.0, 275.0, 389.0, 542.0, 839.0, 1216.0, 1710.0, 2669.0, 3970.0, 6194.0, 10212.0, 17637.0, 35771.0, 123558.0, 606771.0, 147948.0, 39043.0, 18968.0, 10721.0, 6557.0, 4097.0, 2784.0, 1787.0, 1241.0, 859.0, 604.0, 425.0, 294.0, 195.0, 144.0, 107.0, 85.0, 55.0, 40.0, 35.0, 22.0, 15.0, 10.0, 8.0, 5.0, 4.0, 3.0, 4.0, 1.0, 2.0], "bins": [-18.609375, -18.0546875, -17.5, -16.9453125, -16.390625, -15.8359375, -15.28125, -14.7265625, -14.171875, -13.6171875, -13.0625, -12.5078125, -11.953125, -11.3984375, -10.84375, -10.2890625, -9.734375, -9.1796875, -8.625, -8.0703125, -7.515625, -6.9609375, -6.40625, -5.8515625, -5.296875, -4.7421875, -4.1875, -3.6328125, -3.078125, -2.5234375, -1.96875, -1.4140625, -0.859375, -0.3046875, 0.25, 0.8046875, 1.359375, 1.9140625, 2.46875, 3.0234375, 3.578125, 4.1328125, 4.6875, 5.2421875, 5.796875, 6.3515625, 6.90625, 7.4609375, 8.015625, 8.5703125, 9.125, 9.6796875, 10.234375, 10.7890625, 11.34375, 11.8984375, 12.453125, 13.0078125, 13.5625, 14.1171875, 14.671875, 15.2265625, 15.78125, 16.3359375, 16.890625]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 6.0, 7.0, 12.0, 19.0, 13.0, 16.0, 19.0, 14.0, 20.0, 32.0, 30.0, 38.0, 33.0, 38.0, 46.0, 49.0, 68.0, 101.0, 422.0, 1452.0, 113.0, 73.0, 61.0, 41.0, 48.0, 30.0, 39.0, 35.0, 31.0, 17.0, 32.0, 13.0, 16.0, 14.0, 14.0, 5.0, 9.0, 4.0, 8.0, 0.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.5625, -38.36376953125, -37.1650390625, -35.96630859375, -34.767578125, -33.56884765625, -32.3701171875, -31.17138671875, -29.97265625, -28.77392578125, -27.5751953125, -26.37646484375, -25.177734375, -23.97900390625, -22.7802734375, -21.58154296875, -20.3828125, -19.18408203125, -17.9853515625, -16.78662109375, -15.587890625, -14.38916015625, -13.1904296875, -11.99169921875, -10.79296875, -9.59423828125, -8.3955078125, -7.19677734375, -5.998046875, -4.79931640625, -3.6005859375, -2.40185546875, -1.203125, -0.00439453125, 1.1943359375, 2.39306640625, 3.591796875, 4.79052734375, 5.9892578125, 7.18798828125, 8.38671875, 9.58544921875, 10.7841796875, 11.98291015625, 13.181640625, 14.38037109375, 15.5791015625, 16.77783203125, 17.9765625, 19.17529296875, 20.3740234375, 21.57275390625, 22.771484375, 23.97021484375, 25.1689453125, 26.36767578125, 27.56640625, 28.76513671875, 29.9638671875, 31.16259765625, 32.361328125, 33.56005859375, 34.7587890625, 35.95751953125, 37.15625]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 9.0, 8.0, 10.0, 7.0, 21.0, 25.0, 24.0, 35.0, 56.0, 49.0, 78.0, 117.0, 189.0, 316.0, 627.0, 1569.0, 4319.0, 14289.0, 63878.0, 2662290.0, 349577.0, 34120.0, 8918.0, 2792.0, 1076.0, 481.0, 247.0, 159.0, 112.0, 80.0, 44.0, 39.0, 31.0, 28.0, 19.0, 17.0, 12.0, 11.0, 5.0, 7.0, 4.0, 5.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-49.34375, -47.7421875, -46.140625, -44.5390625, -42.9375, -41.3359375, -39.734375, -38.1328125, -36.53125, -34.9296875, -33.328125, -31.7265625, -30.125, -28.5234375, -26.921875, -25.3203125, -23.71875, -22.1171875, -20.515625, -18.9140625, -17.3125, -15.7109375, -14.109375, -12.5078125, -10.90625, -9.3046875, -7.703125, -6.1015625, -4.5, -2.8984375, -1.296875, 0.3046875, 1.90625, 3.5078125, 5.109375, 6.7109375, 8.3125, 9.9140625, 11.515625, 13.1171875, 14.71875, 16.3203125, 17.921875, 19.5234375, 21.125, 22.7265625, 24.328125, 25.9296875, 27.53125, 29.1328125, 30.734375, 32.3359375, 33.9375, 35.5390625, 37.140625, 38.7421875, 40.34375, 41.9453125, 43.546875, 45.1484375, 46.75, 48.3515625, 49.953125, 51.5546875, 53.15625]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 12.0, 29.0, 97.0, 230.0, 314.0, 219.0, 76.0, 22.0, 10.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.84812545776367, -47.24433898925781, -41.64055252075195, -36.036766052246094, -30.432979583740234, -24.829193115234375, -19.225406646728516, -13.621620178222656, -8.017833709716797, -2.4140472412109375, 3.189739227294922, 8.793525695800781, 14.39731216430664, 20.0010986328125, 25.60488510131836, 31.20867156982422, 36.81245803833008, 42.41624450683594, 48.0200309753418, 53.623817443847656, 59.227603912353516, 64.83139038085938, 70.4351806640625, 76.0389633178711, 81.64274597167969, 87.24653625488281, 92.8503189086914, 98.4541015625, 104.05789184570312, 109.66168212890625, 115.26546478271484, 120.86924743652344, 126.47305297851562, 132.07684326171875, 137.68063354492188, 143.28440856933594, 148.88819885253906, 154.4919891357422, 160.09576416015625, 165.69955444335938, 171.3033447265625, 176.90713500976562, 182.51092529296875, 188.1147003173828, 193.71849060058594, 199.32228088378906, 204.92605590820312, 210.52984619140625, 216.13363647460938, 221.7374267578125, 227.34121704101562, 232.9449920654297, 238.5487823486328, 244.15257263183594, 249.75634765625, 255.36013793945312, 260.96392822265625, 266.5677185058594, 272.1715087890625, 277.7752990722656, 283.37908935546875, 288.98284912109375, 294.5866394042969, 300.1904296875, 305.7942199707031]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 8.0, 9.0, 2.0, 7.0, 11.0, 8.0, 14.0, 10.0, 18.0, 17.0, 19.0, 15.0, 25.0, 36.0, 33.0, 31.0, 35.0, 32.0, 46.0, 34.0, 43.0, 45.0, 47.0, 37.0, 34.0, 30.0, 38.0, 28.0, 36.0, 26.0, 32.0, 30.0, 19.0, 23.0, 20.0, 18.0, 17.0, 10.0, 9.0, 11.0, 10.0, 9.0, 4.0, 7.0, 2.0, 6.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0], "bins": [-104.2725830078125, -101.24817657470703, -98.22377014160156, -95.1993637084961, -92.17495727539062, -89.15054321289062, -86.12614440917969, -83.10173034667969, -80.07732391357422, -77.05291748046875, -74.02851104736328, -71.00410461425781, -67.97969818115234, -64.95529174804688, -61.93088150024414, -58.906471252441406, -55.8820686340332, -52.857662200927734, -49.833255767822266, -46.80884552001953, -43.78443908691406, -40.760032653808594, -37.735626220703125, -34.711219787597656, -31.686811447143555, -28.662405014038086, -25.637996673583984, -22.613590240478516, -19.589183807373047, -16.564775466918945, -13.540369033813477, -10.515960693359375, -7.491554260253906, -4.467146873474121, -1.4427399635314941, 1.5816669464111328, 4.606074333190918, 7.630481719970703, 10.654888153076172, 13.679296493530273, 16.703702926635742, 19.72810935974121, 22.752517700195312, 25.77692413330078, 28.80133056640625, 31.82573890686035, 34.85014343261719, 37.87455368041992, 40.89896011352539, 43.92336654663086, 46.94777297973633, 49.97218322753906, 52.99658966064453, 56.02099609375, 59.04540252685547, 62.06980895996094, 65.0942153930664, 68.11862182617188, 71.14302825927734, 74.16743469238281, 77.19184112548828, 80.21624755859375, 83.24066162109375, 86.26506805419922, 89.28947448730469]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 6.0, 3.0, 11.0, 11.0, 15.0, 19.0, 19.0, 11.0, 27.0, 26.0, 39.0, 23.0, 18.0, 26.0, 32.0, 43.0, 40.0, 49.0, 33.0, 41.0, 49.0, 41.0, 47.0, 35.0, 50.0, 37.0, 30.0, 27.0, 37.0, 17.0, 24.0, 22.0, 13.0, 11.0, 14.0, 12.0, 12.0, 6.0, 4.0, 4.0, 4.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.8125, -13.4041748046875, -12.995849609375, -12.5875244140625, -12.17919921875, -11.7708740234375, -11.362548828125, -10.9542236328125, -10.5458984375, -10.1375732421875, -9.729248046875, -9.3209228515625, -8.91259765625, -8.5042724609375, -8.095947265625, -7.6876220703125, -7.279296875, -6.8709716796875, -6.462646484375, -6.0543212890625, -5.64599609375, -5.2376708984375, -4.829345703125, -4.4210205078125, -4.0126953125, -3.6043701171875, -3.196044921875, -2.7877197265625, -2.37939453125, -1.9710693359375, -1.562744140625, -1.1544189453125, -0.74609375, -0.3377685546875, 0.070556640625, 0.4788818359375, 0.88720703125, 1.2955322265625, 1.703857421875, 2.1121826171875, 2.5205078125, 2.9288330078125, 3.337158203125, 3.7454833984375, 4.15380859375, 4.5621337890625, 4.970458984375, 5.3787841796875, 5.787109375, 6.1954345703125, 6.603759765625, 7.0120849609375, 7.42041015625, 7.8287353515625, 8.237060546875, 8.6453857421875, 9.0537109375, 9.4620361328125, 9.870361328125, 10.2786865234375, 10.68701171875, 11.0953369140625, 11.503662109375, 11.9119873046875, 12.3203125]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 0.0, 4.0, 7.0, 7.0, 9.0, 7.0, 9.0, 21.0, 22.0, 34.0, 34.0, 64.0, 100.0, 182.0, 286.0, 469.0, 953.0, 1783.0, 3376.0, 7161.0, 16217.0, 45591.0, 302019.0, 2766672.0, 920398.0, 85894.0, 23397.0, 9929.0, 4473.0, 2359.0, 1183.0, 636.0, 369.0, 220.0, 134.0, 76.0, 38.0, 47.0, 17.0, 21.0, 8.0, 13.0, 9.0, 4.0, 5.0, 9.0, 6.0, 3.0, 2.0, 2.0, 7.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-27.546875, -26.64990234375, -25.7529296875, -24.85595703125, -23.958984375, -23.06201171875, -22.1650390625, -21.26806640625, -20.37109375, -19.47412109375, -18.5771484375, -17.68017578125, -16.783203125, -15.88623046875, -14.9892578125, -14.09228515625, -13.1953125, -12.29833984375, -11.4013671875, -10.50439453125, -9.607421875, -8.71044921875, -7.8134765625, -6.91650390625, -6.01953125, -5.12255859375, -4.2255859375, -3.32861328125, -2.431640625, -1.53466796875, -0.6376953125, 0.25927734375, 1.15625, 2.05322265625, 2.9501953125, 3.84716796875, 4.744140625, 5.64111328125, 6.5380859375, 7.43505859375, 8.33203125, 9.22900390625, 10.1259765625, 11.02294921875, 11.919921875, 12.81689453125, 13.7138671875, 14.61083984375, 15.5078125, 16.40478515625, 17.3017578125, 18.19873046875, 19.095703125, 19.99267578125, 20.8896484375, 21.78662109375, 22.68359375, 23.58056640625, 24.4775390625, 25.37451171875, 26.271484375, 27.16845703125, 28.0654296875, 28.96240234375, 29.859375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 7.0, 2.0, 8.0, 13.0, 13.0, 11.0, 15.0, 27.0, 36.0, 39.0, 59.0, 73.0, 108.0, 162.0, 317.0, 589.0, 842.0, 693.0, 383.0, 228.0, 129.0, 88.0, 61.0, 35.0, 25.0, 29.0, 21.0, 13.0, 12.0, 7.0, 13.0, 6.0, 6.0, 2.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.453125, -23.60205078125, -22.7509765625, -21.89990234375, -21.048828125, -20.19775390625, -19.3466796875, -18.49560546875, -17.64453125, -16.79345703125, -15.9423828125, -15.09130859375, -14.240234375, -13.38916015625, -12.5380859375, -11.68701171875, -10.8359375, -9.98486328125, -9.1337890625, -8.28271484375, -7.431640625, -6.58056640625, -5.7294921875, -4.87841796875, -4.02734375, -3.17626953125, -2.3251953125, -1.47412109375, -0.623046875, 0.22802734375, 1.0791015625, 1.93017578125, 2.78125, 3.63232421875, 4.4833984375, 5.33447265625, 6.185546875, 7.03662109375, 7.8876953125, 8.73876953125, 9.58984375, 10.44091796875, 11.2919921875, 12.14306640625, 12.994140625, 13.84521484375, 14.6962890625, 15.54736328125, 16.3984375, 17.24951171875, 18.1005859375, 18.95166015625, 19.802734375, 20.65380859375, 21.5048828125, 22.35595703125, 23.20703125, 24.05810546875, 24.9091796875, 25.76025390625, 26.611328125, 27.46240234375, 28.3134765625, 29.16455078125, 30.015625]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 11.0, 11.0, 16.0, 16.0, 24.0, 33.0, 35.0, 96.0, 138.0, 298.0, 955.0, 4823.0, 52995.0, 3789833.0, 327813.0, 14128.0, 2025.0, 508.0, 175.0, 125.0, 74.0, 35.0, 34.0, 15.0, 18.0, 9.0, 10.0, 12.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-119.25, -116.0048828125, -112.759765625, -109.5146484375, -106.26953125, -103.0244140625, -99.779296875, -96.5341796875, -93.2890625, -90.0439453125, -86.798828125, -83.5537109375, -80.30859375, -77.0634765625, -73.818359375, -70.5732421875, -67.328125, -64.0830078125, -60.837890625, -57.5927734375, -54.34765625, -51.1025390625, -47.857421875, -44.6123046875, -41.3671875, -38.1220703125, -34.876953125, -31.6318359375, -28.38671875, -25.1416015625, -21.896484375, -18.6513671875, -15.40625, -12.1611328125, -8.916015625, -5.6708984375, -2.42578125, 0.8193359375, 4.064453125, 7.3095703125, 10.5546875, 13.7998046875, 17.044921875, 20.2900390625, 23.53515625, 26.7802734375, 30.025390625, 33.2705078125, 36.515625, 39.7607421875, 43.005859375, 46.2509765625, 49.49609375, 52.7412109375, 55.986328125, 59.2314453125, 62.4765625, 65.7216796875, 68.966796875, 72.2119140625, 75.45703125, 78.7021484375, 81.947265625, 85.1923828125, 88.4375]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 7.0, 26.0, 61.0, 182.0, 300.0, 241.0, 135.0, 38.0, 18.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-394.0019226074219, -386.23809814453125, -378.4742431640625, -370.7104187011719, -362.94659423828125, -355.1827392578125, -347.4189147949219, -339.65509033203125, -331.8912353515625, -324.1274108886719, -316.3635559082031, -308.5997314453125, -300.8359069824219, -293.0720520019531, -285.3082275390625, -277.5444030761719, -269.78057861328125, -262.0167541503906, -254.25291442871094, -246.48907470703125, -238.72523498535156, -230.96139526367188, -223.19757080078125, -215.43373107910156, -207.66989135742188, -199.9060516357422, -192.14222717285156, -184.37838745117188, -176.6145477294922, -168.8507080078125, -161.08688354492188, -153.3230438232422, -145.5592041015625, -137.7953643798828, -130.0315399169922, -122.2677001953125, -114.50386047363281, -106.74002838134766, -98.9761962890625, -91.21235656738281, -83.44851684570312, -75.68468475341797, -67.92084503173828, -60.157012939453125, -52.3931770324707, -44.62934112548828, -36.865509033203125, -29.101673126220703, -21.33783721923828, -13.574002265930176, -5.81016731262207, 1.9536666870117188, 9.71750259399414, 17.481338500976562, 25.24517059326172, 33.00900650024414, 40.77284240722656, 48.536678314208984, 56.300514221191406, 64.06434631347656, 71.82818603515625, 79.5920181274414, 87.35585021972656, 95.11968994140625, 102.8835220336914]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 5.0, 2.0, 7.0, 6.0, 17.0, 6.0, 10.0, 16.0, 20.0, 15.0, 16.0, 22.0, 24.0, 16.0, 24.0, 25.0, 29.0, 26.0, 38.0, 34.0, 29.0, 39.0, 41.0, 54.0, 37.0, 36.0, 31.0, 43.0, 26.0, 31.0, 39.0, 23.0, 31.0, 19.0, 23.0, 25.0, 16.0, 11.0, 18.0, 16.0, 13.0, 13.0, 5.0, 4.0, 2.0, 6.0, 8.0, 4.0, 2.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-63.54621124267578, -61.51509475708008, -59.48397445678711, -57.452857971191406, -55.42173767089844, -53.390621185302734, -51.35950469970703, -49.32838439941406, -47.29726791381836, -45.266151428222656, -43.23503112792969, -41.203914642333984, -39.17279815673828, -37.14167785644531, -35.11056137084961, -33.079444885253906, -31.048324584960938, -29.0172061920166, -26.986087799072266, -24.954971313476562, -22.923852920532227, -20.89273452758789, -18.861618041992188, -16.83049964904785, -14.799381256103516, -12.76826286315918, -10.73714542388916, -8.70602798461914, -6.674909591674805, -4.643791198730469, -2.612673759460449, -0.5815563201904297, 1.4495697021484375, 3.4806876182556152, 5.511805534362793, 7.542923450469971, 9.574041366577148, 11.605159759521484, 13.636277198791504, 15.667394638061523, 17.69851303100586, 19.729631423950195, 21.76074981689453, 23.791866302490234, 25.82298469543457, 27.854103088378906, 29.88521957397461, 31.916337966918945, 33.94745635986328, 35.978572845458984, 38.00969314575195, 40.040809631347656, 42.071929931640625, 44.10304641723633, 46.13416290283203, 48.165283203125, 50.1963996887207, 52.227516174316406, 54.258636474609375, 56.28975296020508, 58.32086944580078, 60.35198974609375, 62.38310623168945, 64.41422271728516, 66.44534301757812]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 4.0, 5.0, 4.0, 8.0, 10.0, 16.0, 21.0, 17.0, 27.0, 27.0, 26.0, 36.0, 36.0, 35.0, 32.0, 36.0, 49.0, 41.0, 36.0, 48.0, 47.0, 40.0, 35.0, 40.0, 48.0, 39.0, 27.0, 30.0, 41.0, 26.0, 25.0, 11.0, 17.0, 13.0, 11.0, 6.0, 4.0, 6.0, 8.0, 4.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0], "bins": [-15.6875, -15.247314453125, -14.80712890625, -14.366943359375, -13.9267578125, -13.486572265625, -13.04638671875, -12.606201171875, -12.166015625, -11.725830078125, -11.28564453125, -10.845458984375, -10.4052734375, -9.965087890625, -9.52490234375, -9.084716796875, -8.64453125, -8.204345703125, -7.76416015625, -7.323974609375, -6.8837890625, -6.443603515625, -6.00341796875, -5.563232421875, -5.123046875, -4.682861328125, -4.24267578125, -3.802490234375, -3.3623046875, -2.922119140625, -2.48193359375, -2.041748046875, -1.6015625, -1.161376953125, -0.72119140625, -0.281005859375, 0.1591796875, 0.599365234375, 1.03955078125, 1.479736328125, 1.919921875, 2.360107421875, 2.80029296875, 3.240478515625, 3.6806640625, 4.120849609375, 4.56103515625, 5.001220703125, 5.44140625, 5.881591796875, 6.32177734375, 6.761962890625, 7.2021484375, 7.642333984375, 8.08251953125, 8.522705078125, 8.962890625, 9.403076171875, 9.84326171875, 10.283447265625, 10.7236328125, 11.163818359375, 11.60400390625, 12.044189453125, 12.484375]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 4.0, 2.0, 11.0, 8.0, 13.0, 18.0, 31.0, 64.0, 78.0, 125.0, 171.0, 296.0, 453.0, 611.0, 1011.0, 1528.0, 2489.0, 3766.0, 6053.0, 9641.0, 15366.0, 25308.0, 41255.0, 67680.0, 109192.0, 170836.0, 216263.0, 142470.0, 89579.0, 55354.0, 33533.0, 20693.0, 12650.0, 8029.0, 5071.0, 3124.0, 2032.0, 1274.0, 840.0, 580.0, 352.0, 242.0, 155.0, 99.0, 65.0, 47.0, 31.0, 23.0, 18.0, 12.0, 8.0, 5.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.31201171875, -0.3029136657714844, -0.29381561279296875, -0.2847175598144531, -0.2756195068359375, -0.2665214538574219, -0.25742340087890625, -0.24832534790039062, -0.239227294921875, -0.23012924194335938, -0.22103118896484375, -0.21193313598632812, -0.2028350830078125, -0.19373703002929688, -0.18463897705078125, -0.17554092407226562, -0.16644287109375, -0.15734481811523438, -0.14824676513671875, -0.13914871215820312, -0.1300506591796875, -0.12095260620117188, -0.11185455322265625, -0.10275650024414062, -0.093658447265625, -0.08456039428710938, -0.07546234130859375, -0.06636428833007812, -0.0572662353515625, -0.048168182373046875, -0.03907012939453125, -0.029972076416015625, -0.0208740234375, -0.011775970458984375, -0.00267791748046875, 0.006420135498046875, 0.0155181884765625, 0.024616241455078125, 0.03371429443359375, 0.042812347412109375, 0.051910400390625, 0.061008453369140625, 0.07010650634765625, 0.07920455932617188, 0.0883026123046875, 0.09740066528320312, 0.10649871826171875, 0.11559677124023438, 0.12469482421875, 0.13379287719726562, 0.14289093017578125, 0.15198898315429688, 0.1610870361328125, 0.17018508911132812, 0.17928314208984375, 0.18838119506835938, 0.197479248046875, 0.20657730102539062, 0.21567535400390625, 0.22477340698242188, 0.2338714599609375, 0.24296951293945312, 0.25206756591796875, 0.2611656188964844, 0.270263671875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 1.0, 4.0, 3.0, 5.0, 5.0, 8.0, 12.0, 14.0, 14.0, 14.0, 18.0, 20.0, 18.0, 15.0, 28.0, 28.0, 28.0, 34.0, 28.0, 31.0, 46.0, 37.0, 35.0, 36.0, 43.0, 1063.0, 28.0, 34.0, 37.0, 25.0, 34.0, 39.0, 29.0, 25.0, 25.0, 30.0, 20.0, 19.0, 17.0, 17.0, 13.0, 15.0, 7.0, 2.0, 8.0, 5.0, 5.0, 3.0, 0.0, 2.0, 5.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-9.6484375, -9.3492431640625, -9.050048828125, -8.7508544921875, -8.45166015625, -8.1524658203125, -7.853271484375, -7.5540771484375, -7.2548828125, -6.9556884765625, -6.656494140625, -6.3572998046875, -6.05810546875, -5.7589111328125, -5.459716796875, -5.1605224609375, -4.861328125, -4.5621337890625, -4.262939453125, -3.9637451171875, -3.66455078125, -3.3653564453125, -3.066162109375, -2.7669677734375, -2.4677734375, -2.1685791015625, -1.869384765625, -1.5701904296875, -1.27099609375, -0.9718017578125, -0.672607421875, -0.3734130859375, -0.07421875, 0.2249755859375, 0.524169921875, 0.8233642578125, 1.12255859375, 1.4217529296875, 1.720947265625, 2.0201416015625, 2.3193359375, 2.6185302734375, 2.917724609375, 3.2169189453125, 3.51611328125, 3.8153076171875, 4.114501953125, 4.4136962890625, 4.712890625, 5.0120849609375, 5.311279296875, 5.6104736328125, 5.90966796875, 6.2088623046875, 6.508056640625, 6.8072509765625, 7.1064453125, 7.4056396484375, 7.704833984375, 8.0040283203125, 8.30322265625, 8.6024169921875, 8.901611328125, 9.2008056640625, 9.5]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 4.0, 9.0, 17.0, 26.0, 44.0, 60.0, 80.0, 121.0, 174.0, 222.0, 344.0, 459.0, 669.0, 979.0, 1348.0, 1968.0, 2793.0, 4209.0, 6275.0, 9380.0, 14070.0, 21643.0, 33014.0, 51496.0, 80813.0, 133304.0, 1252117.0, 177618.0, 109312.0, 67486.0, 43410.0, 27872.0, 18331.0, 12229.0, 8118.0, 5278.0, 3718.0, 2455.0, 1744.0, 1191.0, 863.0, 556.0, 379.0, 274.0, 203.0, 138.0, 104.0, 73.0, 56.0, 31.0, 15.0, 20.0, 11.0, 9.0, 3.0, 2.0, 2.0, 1.0], "bins": [-0.1551513671875, -0.150421142578125, -0.14569091796875, -0.140960693359375, -0.13623046875, -0.131500244140625, -0.12677001953125, -0.122039794921875, -0.1173095703125, -0.112579345703125, -0.10784912109375, -0.103118896484375, -0.098388671875, -0.093658447265625, -0.08892822265625, -0.084197998046875, -0.0794677734375, -0.074737548828125, -0.07000732421875, -0.065277099609375, -0.060546875, -0.055816650390625, -0.05108642578125, -0.046356201171875, -0.0416259765625, -0.036895751953125, -0.03216552734375, -0.027435302734375, -0.022705078125, -0.017974853515625, -0.01324462890625, -0.008514404296875, -0.0037841796875, 0.000946044921875, 0.00567626953125, 0.010406494140625, 0.01513671875, 0.019866943359375, 0.02459716796875, 0.029327392578125, 0.0340576171875, 0.038787841796875, 0.04351806640625, 0.048248291015625, 0.052978515625, 0.057708740234375, 0.06243896484375, 0.067169189453125, 0.0718994140625, 0.076629638671875, 0.08135986328125, 0.086090087890625, 0.0908203125, 0.095550537109375, 0.10028076171875, 0.105010986328125, 0.1097412109375, 0.114471435546875, 0.11920166015625, 0.123931884765625, 0.128662109375, 0.133392333984375, 0.13812255859375, 0.142852783203125, 0.1475830078125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 6.0, 14.0, 11.0, 10.0, 15.0, 18.0, 20.0, 27.0, 35.0, 43.0, 51.0, 70.0, 53.0, 62.0, 76.0, 72.0, 79.0, 65.0, 50.0, 42.0, 43.0, 28.0, 19.0, 23.0, 15.0, 17.0, 8.0, 3.0, 2.0, 5.0, 2.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010423660278320312, -0.0010128617286682129, -0.0009833574295043945, -0.0009538531303405762, -0.0009243488311767578, -0.0008948445320129395, -0.0008653402328491211, -0.0008358359336853027, -0.0008063316345214844, -0.000776827335357666, -0.0007473230361938477, -0.0007178187370300293, -0.0006883144378662109, -0.0006588101387023926, -0.0006293058395385742, -0.0005998015403747559, -0.0005702972412109375, -0.0005407929420471191, -0.0005112886428833008, -0.0004817843437194824, -0.00045228004455566406, -0.0004227757453918457, -0.00039327144622802734, -0.000363767147064209, -0.0003342628479003906, -0.00030475854873657227, -0.0002752542495727539, -0.00024574995040893555, -0.0002162456512451172, -0.00018674135208129883, -0.00015723705291748047, -0.0001277327537536621, -9.822845458984375e-05, -6.872415542602539e-05, -3.921985626220703e-05, -9.715557098388672e-06, 1.9788742065429688e-05, 4.929304122924805e-05, 7.87973403930664e-05, 0.00010830163955688477, 0.00013780593872070312, 0.00016731023788452148, 0.00019681453704833984, 0.0002263188362121582, 0.00025582313537597656, 0.0002853274345397949, 0.0003148317337036133, 0.00034433603286743164, 0.00037384033203125, 0.00040334463119506836, 0.0004328489303588867, 0.0004623532295227051, 0.0004918575286865234, 0.0005213618278503418, 0.0005508661270141602, 0.0005803704261779785, 0.0006098747253417969, 0.0006393790245056152, 0.0006688833236694336, 0.000698387622833252, 0.0007278919219970703, 0.0007573962211608887, 0.000786900520324707, 0.0008164048194885254, 0.0008459091186523438]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 3.0, 4.0, 3.0, 3.0, 9.0, 16.0, 17.0, 23.0, 21.0, 39.0, 49.0, 55.0, 93.0, 169.0, 384.0, 2094.0, 1033817.0, 10620.0, 555.0, 196.0, 112.0, 71.0, 48.0, 32.0, 23.0, 21.0, 16.0, 8.0, 12.0, 13.0, 7.0, 7.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01959228515625, -0.018908977508544922, -0.018225669860839844, -0.017542362213134766, -0.016859054565429688, -0.01617574691772461, -0.015492439270019531, -0.014809131622314453, -0.014125823974609375, -0.013442516326904297, -0.012759208679199219, -0.01207590103149414, -0.011392593383789062, -0.010709285736083984, -0.010025978088378906, -0.009342670440673828, -0.00865936279296875, -0.007976055145263672, -0.007292747497558594, -0.006609439849853516, -0.0059261322021484375, -0.005242824554443359, -0.004559516906738281, -0.003876209259033203, -0.003192901611328125, -0.002509593963623047, -0.0018262863159179688, -0.0011429786682128906, -0.0004596710205078125, 0.00022363662719726562, 0.0009069442749023438, 0.0015902519226074219, 0.0022735595703125, 0.002956867218017578, 0.0036401748657226562, 0.004323482513427734, 0.0050067901611328125, 0.005690097808837891, 0.006373405456542969, 0.007056713104248047, 0.007740020751953125, 0.008423328399658203, 0.009106636047363281, 0.00978994369506836, 0.010473251342773438, 0.011156558990478516, 0.011839866638183594, 0.012523174285888672, 0.01320648193359375, 0.013889789581298828, 0.014573097229003906, 0.015256404876708984, 0.015939712524414062, 0.01662302017211914, 0.01730632781982422, 0.017989635467529297, 0.018672943115234375, 0.019356250762939453, 0.02003955841064453, 0.02072286605834961, 0.021406173706054688, 0.022089481353759766, 0.022772789001464844, 0.023456096649169922, 0.024139404296875]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 21.0, 994.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.027796540409326553, -0.02728552557528019, -0.026774512603878975, -0.02626349776983261, -0.025752484798431396, -0.025241469964385033, -0.024730456992983818, -0.024219442158937454, -0.02370842918753624, -0.023197414353489876, -0.02268640138208866, -0.022175386548042297, -0.021664373576641083, -0.02115335874259472, -0.020642345771193504, -0.02013133093714714, -0.019620317965745926, -0.019109303131699562, -0.018598290160298347, -0.018087275326251984, -0.01757626235485077, -0.017065247520804405, -0.01655423454940319, -0.016043219715356827, -0.015532204881310463, -0.015021190978586674, -0.014510177075862885, -0.013999163173139095, -0.013488149270415306, -0.012977135367691517, -0.012466121464967728, -0.011955106630921364, -0.011444094590842724, -0.010933080688118935, -0.010422066785395145, -0.009911052882671356, -0.009400038979947567, -0.008889025077223778, -0.008378010243177414, -0.0078669972717762, -0.007355982903391123, -0.006844969000667334, -0.006333955097943544, -0.005822940729558468, -0.005311926826834679, -0.0048009129241108894, -0.0042898990213871, -0.003778885118663311, -0.003267871215939522, -0.0027568573132157326, -0.0022458434104919434, -0.0017348292749375105, -0.0012238153722137213, -0.0007128014694899321, -0.0002017873339354992, 0.00030922656878829, 0.0008202404715120792, 0.0013312543742358685, 0.0018422683933749795, 0.0023532824125140905, 0.0028642963152378798, 0.003375310217961669, 0.003886324353516102, 0.004397338256239891, 0.00490835215896368]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 4.0, 9.0, 20.0, 20.0, 48.0, 35.0, 46.0, 70.0, 59.0, 57.0, 97.0, 95.0, 87.0, 54.0, 69.0, 55.0, 51.0, 39.0, 20.0, 31.0, 17.0, 9.0, 7.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010976195335388184, -0.0010590441524982452, -0.0010204687714576721, -0.000981893390417099, -0.0009433180093765259, -0.0009047426283359528, -0.0008661672472953796, -0.0008275918662548065, -0.0007890164852142334, -0.0007504411041736603, -0.0007118657231330872, -0.000673290342092514, -0.0006347149610519409, -0.0005961395800113678, -0.0005575641989707947, -0.0005189888179302216, -0.00048041343688964844, -0.0004418380558490753, -0.0004032626748085022, -0.0003646872937679291, -0.00032611191272735596, -0.00028753653168678284, -0.0002489611506462097, -0.0002103857696056366, -0.00017181038856506348, -0.00013323500752449036, -9.465962648391724e-05, -5.6084245443344116e-05, -1.7508864402770996e-05, 2.1066516637802124e-05, 5.9641897678375244e-05, 9.821727871894836e-05, 0.00013679265975952148, 0.0001753680408000946, 0.00021394342184066772, 0.00025251880288124084, 0.00029109418392181396, 0.0003296695649623871, 0.0003682449460029602, 0.0004068203270435333, 0.00044539570808410645, 0.00048397108912467957, 0.0005225464701652527, 0.0005611218512058258, 0.0005996972322463989, 0.000638272613286972, 0.0006768479943275452, 0.0007154233753681183, 0.0007539987564086914, 0.0007925741374492645, 0.0008311495184898376, 0.0008697248995304108, 0.0009083002805709839, 0.000946875661611557, 0.0009854510426521301, 0.0010240264236927032, 0.0010626018047332764, 0.0011011771857738495, 0.0011397525668144226, 0.0011783279478549957, 0.0012169033288955688, 0.001255478709936142, 0.001294054090976715, 0.0013326294720172882, 0.0013712048530578613]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 4.0, 5.0, 4.0, 8.0, 10.0, 16.0, 21.0, 17.0, 27.0, 27.0, 26.0, 36.0, 36.0, 35.0, 32.0, 36.0, 49.0, 41.0, 36.0, 48.0, 47.0, 40.0, 35.0, 40.0, 48.0, 39.0, 27.0, 30.0, 41.0, 26.0, 25.0, 11.0, 17.0, 13.0, 11.0, 6.0, 4.0, 6.0, 8.0, 4.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0], "bins": [-15.6875, -15.247314453125, -14.80712890625, -14.366943359375, -13.9267578125, -13.486572265625, -13.04638671875, -12.606201171875, -12.166015625, -11.725830078125, -11.28564453125, -10.845458984375, -10.4052734375, -9.965087890625, -9.52490234375, -9.084716796875, -8.64453125, -8.204345703125, -7.76416015625, -7.323974609375, -6.8837890625, -6.443603515625, -6.00341796875, -5.563232421875, -5.123046875, -4.682861328125, -4.24267578125, -3.802490234375, -3.3623046875, -2.922119140625, -2.48193359375, -2.041748046875, -1.6015625, -1.161376953125, -0.72119140625, -0.281005859375, 0.1591796875, 0.599365234375, 1.03955078125, 1.479736328125, 1.919921875, 2.360107421875, 2.80029296875, 3.240478515625, 3.6806640625, 4.120849609375, 4.56103515625, 5.001220703125, 5.44140625, 5.881591796875, 6.32177734375, 6.761962890625, 7.2021484375, 7.642333984375, 8.08251953125, 8.522705078125, 8.962890625, 9.403076171875, 9.84326171875, 10.283447265625, 10.7236328125, 11.163818359375, 11.60400390625, 12.044189453125, 12.484375]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 12.0, 12.0, 8.0, 24.0, 21.0, 32.0, 56.0, 75.0, 100.0, 174.0, 268.0, 451.0, 760.0, 1283.0, 2078.0, 3496.0, 6501.0, 13329.0, 67869.0, 842644.0, 79158.0, 14402.0, 6640.0, 3655.0, 2162.0, 1283.0, 775.0, 482.0, 283.0, 171.0, 96.0, 73.0, 47.0, 39.0, 22.0, 18.0, 8.0, 12.0, 8.0, 7.0, 6.0, 5.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-27.875, -27.01806640625, -26.1611328125, -25.30419921875, -24.447265625, -23.59033203125, -22.7333984375, -21.87646484375, -21.01953125, -20.16259765625, -19.3056640625, -18.44873046875, -17.591796875, -16.73486328125, -15.8779296875, -15.02099609375, -14.1640625, -13.30712890625, -12.4501953125, -11.59326171875, -10.736328125, -9.87939453125, -9.0224609375, -8.16552734375, -7.30859375, -6.45166015625, -5.5947265625, -4.73779296875, -3.880859375, -3.02392578125, -2.1669921875, -1.31005859375, -0.453125, 0.40380859375, 1.2607421875, 2.11767578125, 2.974609375, 3.83154296875, 4.6884765625, 5.54541015625, 6.40234375, 7.25927734375, 8.1162109375, 8.97314453125, 9.830078125, 10.68701171875, 11.5439453125, 12.40087890625, 13.2578125, 14.11474609375, 14.9716796875, 15.82861328125, 16.685546875, 17.54248046875, 18.3994140625, 19.25634765625, 20.11328125, 20.97021484375, 21.8271484375, 22.68408203125, 23.541015625, 24.39794921875, 25.2548828125, 26.11181640625, 26.96875]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 7.0, 3.0, 7.0, 12.0, 20.0, 14.0, 16.0, 17.0, 25.0, 24.0, 41.0, 28.0, 39.0, 48.0, 55.0, 69.0, 79.0, 487.0, 1585.0, 85.0, 58.0, 48.0, 42.0, 54.0, 33.0, 32.0, 27.0, 29.0, 13.0, 9.0, 14.0, 10.0, 8.0, 1.0, 7.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.5, -44.951171875, -43.40234375, -41.853515625, -40.3046875, -38.755859375, -37.20703125, -35.658203125, -34.109375, -32.560546875, -31.01171875, -29.462890625, -27.9140625, -26.365234375, -24.81640625, -23.267578125, -21.71875, -20.169921875, -18.62109375, -17.072265625, -15.5234375, -13.974609375, -12.42578125, -10.876953125, -9.328125, -7.779296875, -6.23046875, -4.681640625, -3.1328125, -1.583984375, -0.03515625, 1.513671875, 3.0625, 4.611328125, 6.16015625, 7.708984375, 9.2578125, 10.806640625, 12.35546875, 13.904296875, 15.453125, 17.001953125, 18.55078125, 20.099609375, 21.6484375, 23.197265625, 24.74609375, 26.294921875, 27.84375, 29.392578125, 30.94140625, 32.490234375, 34.0390625, 35.587890625, 37.13671875, 38.685546875, 40.234375, 41.783203125, 43.33203125, 44.880859375, 46.4296875, 47.978515625, 49.52734375, 51.076171875, 52.625]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 7.0, 3.0, 8.0, 16.0, 13.0, 17.0, 17.0, 29.0, 39.0, 43.0, 73.0, 107.0, 155.0, 434.0, 1715.0, 8807.0, 339904.0, 2779294.0, 11713.0, 2169.0, 508.0, 195.0, 107.0, 67.0, 59.0, 43.0, 32.0, 33.0, 18.0, 14.0, 14.0, 21.0, 12.0, 5.0, 7.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-86.5, -83.884765625, -81.26953125, -78.654296875, -76.0390625, -73.423828125, -70.80859375, -68.193359375, -65.578125, -62.962890625, -60.34765625, -57.732421875, -55.1171875, -52.501953125, -49.88671875, -47.271484375, -44.65625, -42.041015625, -39.42578125, -36.810546875, -34.1953125, -31.580078125, -28.96484375, -26.349609375, -23.734375, -21.119140625, -18.50390625, -15.888671875, -13.2734375, -10.658203125, -8.04296875, -5.427734375, -2.8125, -0.197265625, 2.41796875, 5.033203125, 7.6484375, 10.263671875, 12.87890625, 15.494140625, 18.109375, 20.724609375, 23.33984375, 25.955078125, 28.5703125, 31.185546875, 33.80078125, 36.416015625, 39.03125, 41.646484375, 44.26171875, 46.876953125, 49.4921875, 52.107421875, 54.72265625, 57.337890625, 59.953125, 62.568359375, 65.18359375, 67.798828125, 70.4140625, 73.029296875, 75.64453125, 78.259765625, 80.875]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 19.0, 228.0, 602.0, 151.0, 15.0, 0.0, 1.0, 0.0, 1.0], "bins": [-409.54376220703125, -402.4053955078125, -395.26702880859375, -388.128662109375, -380.99029541015625, -373.8519287109375, -366.71356201171875, -359.5751953125, -352.43682861328125, -345.2984619140625, -338.16009521484375, -331.021728515625, -323.88336181640625, -316.7449951171875, -309.60662841796875, -302.46826171875, -295.3298645019531, -288.1914978027344, -281.0531311035156, -273.9147644042969, -266.7763977050781, -259.6380310058594, -252.49964904785156, -245.3612823486328, -238.22291564941406, -231.0845489501953, -223.94618225097656, -216.8078155517578, -209.66943359375, -202.53106689453125, -195.3927001953125, -188.25433349609375, -181.115966796875, -173.97760009765625, -166.8392333984375, -159.70086669921875, -152.5625, -145.42413330078125, -138.28575134277344, -131.1473846435547, -124.00901794433594, -116.87065124511719, -109.73228454589844, -102.59391021728516, -95.4555435180664, -88.31717681884766, -81.17880249023438, -74.04043579101562, -66.90206909179688, -59.763702392578125, -52.62533187866211, -45.486961364746094, -38.348594665527344, -31.210227966308594, -24.071857452392578, -16.933486938476562, -9.795124053955078, -2.6567554473876953, 4.4816131591796875, 11.61998176574707, 18.758350372314453, 25.896717071533203, 33.03508758544922, 40.173458099365234, 47.311824798583984]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 6.0, 4.0, 8.0, 4.0, 7.0, 15.0, 8.0, 9.0, 12.0, 17.0, 16.0, 25.0, 19.0, 31.0, 26.0, 30.0, 27.0, 38.0, 42.0, 36.0, 47.0, 52.0, 54.0, 52.0, 34.0, 44.0, 39.0, 39.0, 36.0, 24.0, 35.0, 22.0, 20.0, 18.0, 16.0, 25.0, 13.0, 17.0, 11.0, 7.0, 7.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-114.6417236328125, -111.21849822998047, -107.79527282714844, -104.37203979492188, -100.94881439208984, -97.52558898925781, -94.10236358642578, -90.67913818359375, -87.25590515136719, -83.83267974853516, -80.40945434570312, -76.98622131347656, -73.56299591064453, -70.1397705078125, -66.71654510498047, -63.29331970214844, -59.870094299316406, -56.446868896484375, -53.02363967895508, -49.60041427612305, -46.17718505859375, -42.75395965576172, -39.33073425292969, -35.907508850097656, -32.48427963256836, -29.061052322387695, -25.63782501220703, -22.214599609375, -18.791372299194336, -15.368144989013672, -11.94491958618164, -8.521692276000977, -5.098457336425781, -1.6752305030822754, 1.7479963302612305, 5.171222686767578, 8.594449996948242, 12.017677307128906, 15.440902709960938, 18.8641300201416, 22.287357330322266, 25.71058464050293, 29.133811950683594, 32.557037353515625, 35.980262756347656, 39.40349197387695, 42.826717376708984, 46.24994659423828, 49.67317199707031, 53.096397399902344, 56.51962661743164, 59.94285202026367, 63.36608123779297, 66.789306640625, 70.21253204345703, 73.63575744628906, 77.05899047851562, 80.48221588134766, 83.90544128417969, 87.32867431640625, 90.75189971923828, 94.17512512207031, 97.59835052490234, 101.02157592773438, 104.4448013305664]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 6.0, 5.0, 3.0, 4.0, 9.0, 19.0, 18.0, 25.0, 24.0, 22.0, 39.0, 29.0, 33.0, 30.0, 34.0, 32.0, 51.0, 44.0, 42.0, 46.0, 53.0, 42.0, 40.0, 33.0, 46.0, 36.0, 29.0, 38.0, 35.0, 29.0, 22.0, 15.0, 16.0, 7.0, 11.0, 5.0, 8.0, 4.0, 9.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-16.25, -15.7802734375, -15.310546875, -14.8408203125, -14.37109375, -13.9013671875, -13.431640625, -12.9619140625, -12.4921875, -12.0224609375, -11.552734375, -11.0830078125, -10.61328125, -10.1435546875, -9.673828125, -9.2041015625, -8.734375, -8.2646484375, -7.794921875, -7.3251953125, -6.85546875, -6.3857421875, -5.916015625, -5.4462890625, -4.9765625, -4.5068359375, -4.037109375, -3.5673828125, -3.09765625, -2.6279296875, -2.158203125, -1.6884765625, -1.21875, -0.7490234375, -0.279296875, 0.1904296875, 0.66015625, 1.1298828125, 1.599609375, 2.0693359375, 2.5390625, 3.0087890625, 3.478515625, 3.9482421875, 4.41796875, 4.8876953125, 5.357421875, 5.8271484375, 6.296875, 6.7666015625, 7.236328125, 7.7060546875, 8.17578125, 8.6455078125, 9.115234375, 9.5849609375, 10.0546875, 10.5244140625, 10.994140625, 11.4638671875, 11.93359375, 12.4033203125, 12.873046875, 13.3427734375, 13.8125]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 7.0, 2.0, 2.0, 8.0, 12.0, 22.0, 26.0, 35.0, 39.0, 79.0, 126.0, 196.0, 348.0, 666.0, 1457.0, 3202.0, 7336.0, 18503.0, 62129.0, 600904.0, 3030853.0, 391512.0, 49195.0, 15962.0, 6419.0, 2653.0, 1208.0, 554.0, 321.0, 195.0, 105.0, 73.0, 38.0, 26.0, 12.0, 18.0, 9.0, 8.0, 4.0, 5.0, 5.0, 2.0, 3.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-35.4375, -34.407958984375, -33.37841796875, -32.348876953125, -31.3193359375, -30.289794921875, -29.26025390625, -28.230712890625, -27.201171875, -26.171630859375, -25.14208984375, -24.112548828125, -23.0830078125, -22.053466796875, -21.02392578125, -19.994384765625, -18.96484375, -17.935302734375, -16.90576171875, -15.876220703125, -14.8466796875, -13.817138671875, -12.78759765625, -11.758056640625, -10.728515625, -9.698974609375, -8.66943359375, -7.639892578125, -6.6103515625, -5.580810546875, -4.55126953125, -3.521728515625, -2.4921875, -1.462646484375, -0.43310546875, 0.596435546875, 1.6259765625, 2.655517578125, 3.68505859375, 4.714599609375, 5.744140625, 6.773681640625, 7.80322265625, 8.832763671875, 9.8623046875, 10.891845703125, 11.92138671875, 12.950927734375, 13.98046875, 15.010009765625, 16.03955078125, 17.069091796875, 18.0986328125, 19.128173828125, 20.15771484375, 21.187255859375, 22.216796875, 23.246337890625, 24.27587890625, 25.305419921875, 26.3349609375, 27.364501953125, 28.39404296875, 29.423583984375, 30.453125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 10.0, 6.0, 12.0, 19.0, 24.0, 44.0, 58.0, 87.0, 179.0, 357.0, 914.0, 1239.0, 578.0, 265.0, 121.0, 56.0, 28.0, 38.0, 14.0, 6.0, 12.0, 8.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.40625, -51.07080078125, -49.7353515625, -48.39990234375, -47.064453125, -45.72900390625, -44.3935546875, -43.05810546875, -41.72265625, -40.38720703125, -39.0517578125, -37.71630859375, -36.380859375, -35.04541015625, -33.7099609375, -32.37451171875, -31.0390625, -29.70361328125, -28.3681640625, -27.03271484375, -25.697265625, -24.36181640625, -23.0263671875, -21.69091796875, -20.35546875, -19.02001953125, -17.6845703125, -16.34912109375, -15.013671875, -13.67822265625, -12.3427734375, -11.00732421875, -9.671875, -8.33642578125, -7.0009765625, -5.66552734375, -4.330078125, -2.99462890625, -1.6591796875, -0.32373046875, 1.01171875, 2.34716796875, 3.6826171875, 5.01806640625, 6.353515625, 7.68896484375, 9.0244140625, 10.35986328125, 11.6953125, 13.03076171875, 14.3662109375, 15.70166015625, 17.037109375, 18.37255859375, 19.7080078125, 21.04345703125, 22.37890625, 23.71435546875, 25.0498046875, 26.38525390625, 27.720703125, 29.05615234375, 30.3916015625, 31.72705078125, 33.0625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 5.0, 10.0, 10.0, 16.0, 28.0, 67.0, 96.0, 263.0, 568.0, 2158.0, 16275.0, 559943.0, 3571722.0, 38117.0, 3546.0, 806.0, 332.0, 142.0, 72.0, 37.0, 38.0, 15.0, 4.0, 9.0, 3.0, 7.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.8125, -66.5126953125, -63.212890625, -59.9130859375, -56.61328125, -53.3134765625, -50.013671875, -46.7138671875, -43.4140625, -40.1142578125, -36.814453125, -33.5146484375, -30.21484375, -26.9150390625, -23.615234375, -20.3154296875, -17.015625, -13.7158203125, -10.416015625, -7.1162109375, -3.81640625, -0.5166015625, 2.783203125, 6.0830078125, 9.3828125, 12.6826171875, 15.982421875, 19.2822265625, 22.58203125, 25.8818359375, 29.181640625, 32.4814453125, 35.78125, 39.0810546875, 42.380859375, 45.6806640625, 48.98046875, 52.2802734375, 55.580078125, 58.8798828125, 62.1796875, 65.4794921875, 68.779296875, 72.0791015625, 75.37890625, 78.6787109375, 81.978515625, 85.2783203125, 88.578125, 91.8779296875, 95.177734375, 98.4775390625, 101.77734375, 105.0771484375, 108.376953125, 111.6767578125, 114.9765625, 118.2763671875, 121.576171875, 124.8759765625, 128.17578125, 131.4755859375, 134.775390625, 138.0751953125, 141.375]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 7.0, 14.0, 68.0, 183.0, 338.0, 259.0, 104.0, 23.0, 11.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-236.5100860595703, -227.67068481445312, -218.83128356933594, -209.99188232421875, -201.15248107910156, -192.31307983398438, -183.47369384765625, -174.63427734375, -165.79489135742188, -156.9554901123047, -148.1160888671875, -139.2766876220703, -130.43728637695312, -121.59788513183594, -112.75849151611328, -103.9190902709961, -95.07968139648438, -86.24028015136719, -77.40087890625, -68.56147766113281, -59.72208023071289, -50.8826789855957, -42.04328155517578, -33.203880310058594, -24.364479064941406, -15.525078773498535, -6.685678482055664, 2.1537208557128906, 10.993122100830078, 19.832523345947266, 28.671920776367188, 37.511322021484375, 46.350738525390625, 55.19013977050781, 64.029541015625, 72.86894226074219, 81.70834350585938, 90.54774475097656, 99.38713836669922, 108.2265396118164, 117.0659408569336, 125.90534210205078, 134.74473571777344, 143.58413696289062, 152.4235382080078, 161.262939453125, 170.1023406982422, 178.94174194335938, 187.78114318847656, 196.62054443359375, 205.45994567871094, 214.29934692382812, 223.1387481689453, 231.9781494140625, 240.81753540039062, 249.65695190429688, 258.496337890625, 267.3357238769531, 276.1751403808594, 285.0145263671875, 293.85394287109375, 302.6933288574219, 311.5327453613281, 320.37213134765625, 329.2115478515625]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 4.0, 8.0, 10.0, 9.0, 7.0, 15.0, 16.0, 24.0, 23.0, 29.0, 32.0, 32.0, 26.0, 39.0, 33.0, 45.0, 36.0, 44.0, 64.0, 47.0, 53.0, 44.0, 44.0, 46.0, 42.0, 38.0, 27.0, 23.0, 21.0, 23.0, 13.0, 9.0, 13.0, 11.0, 13.0, 6.0, 8.0, 5.0, 8.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.86015319824219, -84.16903686523438, -81.47792053222656, -78.78680419921875, -76.09568786621094, -73.40457153320312, -70.71345520019531, -68.02234649658203, -65.33123016357422, -62.640113830566406, -59.948997497558594, -57.25788116455078, -54.566768646240234, -51.87565231323242, -49.18453598022461, -46.49342346191406, -43.802303314208984, -41.11118698120117, -38.42007064819336, -35.72895812988281, -33.037841796875, -30.346725463867188, -27.655609130859375, -24.964494705200195, -22.273378372192383, -19.58226203918457, -16.89114761352539, -14.200031280517578, -11.508915901184082, -8.817800521850586, -6.126684188842773, -3.4355697631835938, -0.7444534301757812, 1.946662187576294, 4.637777805328369, 7.328893661499023, 10.02000904083252, 12.711124420166016, 15.402240753173828, 18.093355178833008, 20.78447151184082, 23.475587844848633, 26.166702270507812, 28.857818603515625, 31.548934936523438, 34.24005126953125, 36.93116760253906, 39.62228012084961, 42.31339645385742, 45.004512786865234, 47.69562911987305, 50.386741638183594, 53.077857971191406, 55.76897430419922, 58.46009063720703, 61.151206970214844, 63.842323303222656, 66.53343963623047, 69.22455596923828, 71.9156723022461, 74.6067886352539, 77.29789733886719, 79.989013671875, 82.68013000488281, 85.37124633789062]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 8.0, 4.0, 3.0, 8.0, 7.0, 9.0, 7.0, 18.0, 20.0, 12.0, 26.0, 15.0, 28.0, 23.0, 28.0, 41.0, 48.0, 36.0, 46.0, 44.0, 40.0, 51.0, 47.0, 47.0, 41.0, 38.0, 24.0, 31.0, 32.0, 37.0, 22.0, 31.0, 23.0, 28.0, 14.0, 15.0, 12.0, 7.0, 8.0, 8.0, 5.0, 6.0, 3.0, 4.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.6171875, -15.142333984375, -14.66748046875, -14.192626953125, -13.7177734375, -13.242919921875, -12.76806640625, -12.293212890625, -11.818359375, -11.343505859375, -10.86865234375, -10.393798828125, -9.9189453125, -9.444091796875, -8.96923828125, -8.494384765625, -8.01953125, -7.544677734375, -7.06982421875, -6.594970703125, -6.1201171875, -5.645263671875, -5.17041015625, -4.695556640625, -4.220703125, -3.745849609375, -3.27099609375, -2.796142578125, -2.3212890625, -1.846435546875, -1.37158203125, -0.896728515625, -0.421875, 0.052978515625, 0.52783203125, 1.002685546875, 1.4775390625, 1.952392578125, 2.42724609375, 2.902099609375, 3.376953125, 3.851806640625, 4.32666015625, 4.801513671875, 5.2763671875, 5.751220703125, 6.22607421875, 6.700927734375, 7.17578125, 7.650634765625, 8.12548828125, 8.600341796875, 9.0751953125, 9.550048828125, 10.02490234375, 10.499755859375, 10.974609375, 11.449462890625, 11.92431640625, 12.399169921875, 12.8740234375, 13.348876953125, 13.82373046875, 14.298583984375, 14.7734375]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 4.0, 4.0, 3.0, 5.0, 14.0, 26.0, 34.0, 49.0, 81.0, 90.0, 144.0, 205.0, 301.0, 392.0, 578.0, 774.0, 1100.0, 1631.0, 2299.0, 3372.0, 4837.0, 7355.0, 10752.0, 15642.0, 22850.0, 34038.0, 49726.0, 72827.0, 108253.0, 162610.0, 178455.0, 118871.0, 79991.0, 54474.0, 37246.0, 25333.0, 17239.0, 11485.0, 7981.0, 5412.0, 3644.0, 2532.0, 1692.0, 1283.0, 881.0, 677.0, 424.0, 299.0, 194.0, 137.0, 103.0, 62.0, 52.0, 28.0, 35.0, 17.0, 8.0, 6.0, 3.0, 5.0, 3.0, 3.0], "bins": [-0.247802734375, -0.24008750915527344, -0.23237228393554688, -0.2246570587158203, -0.21694183349609375, -0.2092266082763672, -0.20151138305664062, -0.19379615783691406, -0.1860809326171875, -0.17836570739746094, -0.17065048217773438, -0.1629352569580078, -0.15522003173828125, -0.1475048065185547, -0.13978958129882812, -0.13207435607910156, -0.124359130859375, -0.11664390563964844, -0.10892868041992188, -0.10121345520019531, -0.09349822998046875, -0.08578300476074219, -0.07806777954101562, -0.07035255432128906, -0.0626373291015625, -0.05492210388183594, -0.047206878662109375, -0.03949165344238281, -0.03177642822265625, -0.024061203002929688, -0.016345977783203125, -0.008630752563476562, -0.00091552734375, 0.0067996978759765625, 0.014514923095703125, 0.022230148315429688, 0.02994537353515625, 0.03766059875488281, 0.045375823974609375, 0.05309104919433594, 0.0608062744140625, 0.06852149963378906, 0.07623672485351562, 0.08395195007324219, 0.09166717529296875, 0.09938240051269531, 0.10709762573242188, 0.11481285095214844, 0.122528076171875, 0.13024330139160156, 0.13795852661132812, 0.1456737518310547, 0.15338897705078125, 0.1611042022705078, 0.16881942749023438, 0.17653465270996094, 0.1842498779296875, 0.19196510314941406, 0.19968032836914062, 0.2073955535888672, 0.21511077880859375, 0.2228260040283203, 0.23054122924804688, 0.23825645446777344, 0.2459716796875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 5.0, 7.0, 11.0, 8.0, 11.0, 12.0, 17.0, 25.0, 20.0, 23.0, 31.0, 26.0, 32.0, 46.0, 38.0, 48.0, 51.0, 37.0, 34.0, 1070.0, 41.0, 54.0, 40.0, 37.0, 40.0, 42.0, 33.0, 31.0, 21.0, 31.0, 19.0, 13.0, 21.0, 8.0, 12.0, 7.0, 10.0, 8.0, 3.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-14.1328125, -13.7530517578125, -13.373291015625, -12.9935302734375, -12.61376953125, -12.2340087890625, -11.854248046875, -11.4744873046875, -11.0947265625, -10.7149658203125, -10.335205078125, -9.9554443359375, -9.57568359375, -9.1959228515625, -8.816162109375, -8.4364013671875, -8.056640625, -7.6768798828125, -7.297119140625, -6.9173583984375, -6.53759765625, -6.1578369140625, -5.778076171875, -5.3983154296875, -5.0185546875, -4.6387939453125, -4.259033203125, -3.8792724609375, -3.49951171875, -3.1197509765625, -2.739990234375, -2.3602294921875, -1.98046875, -1.6007080078125, -1.220947265625, -0.8411865234375, -0.46142578125, -0.0816650390625, 0.298095703125, 0.6778564453125, 1.0576171875, 1.4373779296875, 1.817138671875, 2.1968994140625, 2.57666015625, 2.9564208984375, 3.336181640625, 3.7159423828125, 4.095703125, 4.4754638671875, 4.855224609375, 5.2349853515625, 5.61474609375, 5.9945068359375, 6.374267578125, 6.7540283203125, 7.1337890625, 7.5135498046875, 7.893310546875, 8.2730712890625, 8.65283203125, 9.0325927734375, 9.412353515625, 9.7921142578125, 10.171875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 7.0, 8.0, 7.0, 7.0, 15.0, 15.0, 35.0, 45.0, 83.0, 130.0, 238.0, 346.0, 573.0, 1062.0, 1704.0, 2788.0, 4731.0, 7675.0, 13309.0, 22927.0, 40266.0, 73250.0, 143613.0, 1320608.0, 219563.0, 109297.0, 57836.0, 32055.0, 18261.0, 10751.0, 6283.0, 3841.0, 2210.0, 1425.0, 859.0, 492.0, 319.0, 182.0, 101.0, 75.0, 51.0, 30.0, 18.0, 16.0, 8.0, 5.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.2265625, -0.21965599060058594, -0.21274948120117188, -0.2058429718017578, -0.19893646240234375, -0.1920299530029297, -0.18512344360351562, -0.17821693420410156, -0.1713104248046875, -0.16440391540527344, -0.15749740600585938, -0.1505908966064453, -0.14368438720703125, -0.1367778778076172, -0.12987136840820312, -0.12296485900878906, -0.116058349609375, -0.10915184020996094, -0.10224533081054688, -0.09533882141113281, -0.08843231201171875, -0.08152580261230469, -0.07461929321289062, -0.06771278381347656, -0.0608062744140625, -0.05389976501464844, -0.046993255615234375, -0.04008674621582031, -0.03318023681640625, -0.026273727416992188, -0.019367218017578125, -0.012460708618164062, -0.00555419921875, 0.0013523101806640625, 0.008258819580078125, 0.015165328979492188, 0.02207183837890625, 0.028978347778320312, 0.035884857177734375, 0.04279136657714844, 0.0496978759765625, 0.05660438537597656, 0.06351089477539062, 0.07041740417480469, 0.07732391357421875, 0.08423042297363281, 0.09113693237304688, 0.09804344177246094, 0.104949951171875, 0.11185646057128906, 0.11876296997070312, 0.1256694793701172, 0.13257598876953125, 0.1394824981689453, 0.14638900756835938, 0.15329551696777344, 0.1602020263671875, 0.16710853576660156, 0.17401504516601562, 0.1809215545654297, 0.18782806396484375, 0.1947345733642578, 0.20164108276367188, 0.20854759216308594, 0.2154541015625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 5.0, 5.0, 4.0, 5.0, 14.0, 14.0, 6.0, 20.0, 11.0, 20.0, 16.0, 17.0, 25.0, 30.0, 35.0, 44.0, 26.0, 27.0, 45.0, 42.0, 58.0, 51.0, 53.0, 46.0, 39.0, 52.0, 36.0, 30.0, 24.0, 30.0, 28.0, 18.0, 22.0, 21.0, 10.0, 18.0, 16.0, 7.0, 5.0, 8.0, 4.0, 3.0, 5.0, 3.0, 6.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003867149353027344, -0.00037195533514022827, -0.00035719573497772217, -0.00034243613481521606, -0.00032767653465270996, -0.00031291693449020386, -0.00029815733432769775, -0.00028339773416519165, -0.00026863813400268555, -0.00025387853384017944, -0.00023911893367767334, -0.00022435933351516724, -0.00020959973335266113, -0.00019484013319015503, -0.00018008053302764893, -0.00016532093286514282, -0.00015056133270263672, -0.00013580173254013062, -0.00012104213237762451, -0.00010628253221511841, -9.15229320526123e-05, -7.67633318901062e-05, -6.20037317276001e-05, -4.7244131565093994e-05, -3.248453140258789e-05, -1.7724931240081787e-05, -2.9653310775756836e-06, 1.179426908493042e-05, 2.6553869247436523e-05, 4.131346940994263e-05, 5.607306957244873e-05, 7.083266973495483e-05, 8.559226989746094e-05, 0.00010035187005996704, 0.00011511147022247314, 0.00012987107038497925, 0.00014463067054748535, 0.00015939027070999146, 0.00017414987087249756, 0.00018890947103500366, 0.00020366907119750977, 0.00021842867136001587, 0.00023318827152252197, 0.0002479478716850281, 0.0002627074718475342, 0.0002774670720100403, 0.0002922266721725464, 0.0003069862723350525, 0.0003217458724975586, 0.0003365054726600647, 0.0003512650728225708, 0.0003660246729850769, 0.000380784273147583, 0.0003955438733100891, 0.0004103034734725952, 0.0004250630736351013, 0.0004398226737976074, 0.0004545822739601135, 0.00046934187412261963, 0.00048410147428512573, 0.0004988610744476318, 0.0005136206746101379, 0.000528380274772644, 0.0005431398749351501, 0.0005578994750976562]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 6.0, 0.0, 6.0, 4.0, 4.0, 6.0, 7.0, 9.0, 11.0, 15.0, 18.0, 22.0, 17.0, 26.0, 34.0, 33.0, 41.0, 68.0, 102.0, 181.0, 303.0, 863.0, 20004.0, 1019707.0, 5481.0, 678.0, 315.0, 130.0, 87.0, 69.0, 68.0, 40.0, 43.0, 28.0, 15.0, 21.0, 15.0, 14.0, 15.0, 6.0, 10.0, 16.0, 4.0, 4.0, 6.0, 4.0, 4.0, 1.0, 3.0, 1.0], "bins": [-0.0124359130859375, -0.01210319995880127, -0.011770486831665039, -0.011437773704528809, -0.011105060577392578, -0.010772347450256348, -0.010439634323120117, -0.010106921195983887, -0.009774208068847656, -0.009441494941711426, -0.009108781814575195, -0.008776068687438965, -0.008443355560302734, -0.008110642433166504, -0.0077779293060302734, -0.007445216178894043, -0.0071125030517578125, -0.006779789924621582, -0.0064470767974853516, -0.006114363670349121, -0.005781650543212891, -0.00544893741607666, -0.00511622428894043, -0.004783511161804199, -0.004450798034667969, -0.004118084907531738, -0.003785371780395508, -0.0034526586532592773, -0.003119945526123047, -0.0027872323989868164, -0.002454519271850586, -0.0021218061447143555, -0.001789093017578125, -0.0014563798904418945, -0.001123666763305664, -0.0007909536361694336, -0.0004582405090332031, -0.00012552738189697266, 0.0002071857452392578, 0.0005398988723754883, 0.0008726119995117188, 0.0012053251266479492, 0.0015380382537841797, 0.0018707513809204102, 0.0022034645080566406, 0.002536177635192871, 0.0028688907623291016, 0.003201603889465332, 0.0035343170166015625, 0.003867030143737793, 0.0041997432708740234, 0.004532456398010254, 0.004865169525146484, 0.005197882652282715, 0.005530595779418945, 0.005863308906555176, 0.006196022033691406, 0.006528735160827637, 0.006861448287963867, 0.007194161415100098, 0.007526874542236328, 0.007859587669372559, 0.008192300796508789, 0.00852501392364502, 0.00885772705078125]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 371.0, 641.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.011258742772042751, -0.011014152318239212, -0.010769560933113098, -0.010524969547986984, -0.010280379094183445, -0.010035788640379906, -0.009791197255253792, -0.009546605870127678, -0.009302015416324139, -0.0090574249625206, -0.008812833577394485, -0.008568242192268372, -0.008323651738464832, -0.008079061284661293, -0.00783446989953518, -0.0075898789800703526, -0.007345288060605526, -0.007100697141140699, -0.006856106221675873, -0.006611515302211046, -0.00636692438274622, -0.006122333463281393, -0.0058777425438165665, -0.00563315162435174, -0.005388560704886913, -0.005143969785422087, -0.00489937886595726, -0.0046547879464924335, -0.004410197027027607, -0.00416560610756278, -0.003921015188097954, -0.003676424268633127, -0.0034318342804908752, -0.0031872433610260487, -0.002942652441561222, -0.0026980615220963955, -0.002453470602631569, -0.0022088796831667423, -0.0019642887637019157, -0.0017196978442370892, -0.0014751069247722626, -0.001230516005307436, -0.0009859250858426094, -0.0007413341663777828, -0.0004967432469129562, -0.00025215232744812965, -7.56140798330307e-06, 0.00023702951148152351, 0.0004816204309463501, 0.0007262113504111767, 0.0009708022698760033, 0.0012153931893408298, 0.0014599841088056564, 0.001704575028270483, 0.0019491659477353096, 0.002193756867200136, 0.0024383477866649628, 0.0026829387061297894, 0.002927529625594616, 0.0031721205450594425, 0.003416711464524269, 0.0036613023839890957, 0.0039058933034539223, 0.004150484222918749, 0.0043950751423835754]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 6.0, 17.0, 32.0, 35.0, 48.0, 63.0, 81.0, 103.0, 116.0, 107.0, 86.0, 84.0, 74.0, 44.0, 36.0, 28.0, 22.0, 11.0, 8.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000894010066986084, -0.00086224265396595, -0.000830475240945816, -0.0007987078279256821, -0.0007669404149055481, -0.0007351730018854141, -0.0007034055888652802, -0.0006716381758451462, -0.0006398707628250122, -0.0006081033498048782, -0.0005763359367847443, -0.0005445685237646103, -0.0005128011107444763, -0.00048103369772434235, -0.0004492662847042084, -0.0004174988716840744, -0.00038573145866394043, -0.00035396404564380646, -0.0003221966326236725, -0.0002904292196035385, -0.00025866180658340454, -0.00022689439356327057, -0.0001951269805431366, -0.00016335956752300262, -0.00013159215450286865, -9.982474148273468e-05, -6.805732846260071e-05, -3.6289915442466736e-05, -4.522502422332764e-06, 2.724491059780121e-05, 5.901232361793518e-05, 9.077973663806915e-05, 0.00012254714965820312, 0.0001543145626783371, 0.00018608197569847107, 0.00021784938871860504, 0.000249616801738739, 0.000281384214758873, 0.00031315162777900696, 0.00034491904079914093, 0.0003766864538192749, 0.0004084538668394089, 0.00044022127985954285, 0.0004719886928796768, 0.0005037561058998108, 0.0005355235189199448, 0.0005672909319400787, 0.0005990583449602127, 0.0006308257579803467, 0.0006625931710004807, 0.0006943605840206146, 0.0007261279970407486, 0.0007578954100608826, 0.0007896628230810165, 0.0008214302361011505, 0.0008531976491212845, 0.0008849650621414185, 0.0009167324751615524, 0.0009484998881816864, 0.0009802673012018204, 0.0010120347142219543, 0.0010438021272420883, 0.0010755695402622223, 0.0011073369532823563, 0.0011391043663024902]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 8.0, 4.0, 3.0, 8.0, 7.0, 9.0, 7.0, 18.0, 20.0, 12.0, 26.0, 15.0, 28.0, 23.0, 28.0, 41.0, 48.0, 36.0, 46.0, 44.0, 40.0, 51.0, 47.0, 47.0, 41.0, 38.0, 24.0, 31.0, 32.0, 37.0, 22.0, 31.0, 23.0, 28.0, 14.0, 15.0, 12.0, 7.0, 8.0, 8.0, 5.0, 6.0, 3.0, 4.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.6171875, -15.142333984375, -14.66748046875, -14.192626953125, -13.7177734375, -13.242919921875, -12.76806640625, -12.293212890625, -11.818359375, -11.343505859375, -10.86865234375, -10.393798828125, -9.9189453125, -9.444091796875, -8.96923828125, -8.494384765625, -8.01953125, -7.544677734375, -7.06982421875, -6.594970703125, -6.1201171875, -5.645263671875, -5.17041015625, -4.695556640625, -4.220703125, -3.745849609375, -3.27099609375, -2.796142578125, -2.3212890625, -1.846435546875, -1.37158203125, -0.896728515625, -0.421875, 0.052978515625, 0.52783203125, 1.002685546875, 1.4775390625, 1.952392578125, 2.42724609375, 2.902099609375, 3.376953125, 3.851806640625, 4.32666015625, 4.801513671875, 5.2763671875, 5.751220703125, 6.22607421875, 6.700927734375, 7.17578125, 7.650634765625, 8.12548828125, 8.600341796875, 9.0751953125, 9.550048828125, 10.02490234375, 10.499755859375, 10.974609375, 11.449462890625, 11.92431640625, 12.399169921875, 12.8740234375, 13.348876953125, 13.82373046875, 14.298583984375, 14.7734375]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 7.0, 10.0, 14.0, 21.0, 16.0, 32.0, 31.0, 53.0, 78.0, 100.0, 136.0, 187.0, 293.0, 444.0, 683.0, 1071.0, 1834.0, 3074.0, 5362.0, 9188.0, 17119.0, 46504.0, 736559.0, 168389.0, 27006.0, 12746.0, 7052.0, 4042.0, 2417.0, 1438.0, 879.0, 542.0, 387.0, 227.0, 150.0, 117.0, 72.0, 67.0, 52.0, 31.0, 20.0, 21.0, 19.0, 16.0, 15.0, 13.0, 6.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-28.234375, -27.372802734375, -26.51123046875, -25.649658203125, -24.7880859375, -23.926513671875, -23.06494140625, -22.203369140625, -21.341796875, -20.480224609375, -19.61865234375, -18.757080078125, -17.8955078125, -17.033935546875, -16.17236328125, -15.310791015625, -14.44921875, -13.587646484375, -12.72607421875, -11.864501953125, -11.0029296875, -10.141357421875, -9.27978515625, -8.418212890625, -7.556640625, -6.695068359375, -5.83349609375, -4.971923828125, -4.1103515625, -3.248779296875, -2.38720703125, -1.525634765625, -0.6640625, 0.197509765625, 1.05908203125, 1.920654296875, 2.7822265625, 3.643798828125, 4.50537109375, 5.366943359375, 6.228515625, 7.090087890625, 7.95166015625, 8.813232421875, 9.6748046875, 10.536376953125, 11.39794921875, 12.259521484375, 13.12109375, 13.982666015625, 14.84423828125, 15.705810546875, 16.5673828125, 17.428955078125, 18.29052734375, 19.152099609375, 20.013671875, 20.875244140625, 21.73681640625, 22.598388671875, 23.4599609375, 24.321533203125, 25.18310546875, 26.044677734375, 26.90625]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 3.0, 4.0, 4.0, 4.0, 7.0, 6.0, 5.0, 4.0, 9.0, 17.0, 19.0, 21.0, 31.0, 24.0, 29.0, 38.0, 35.0, 44.0, 36.0, 46.0, 67.0, 103.0, 1743.0, 264.0, 80.0, 59.0, 43.0, 46.0, 37.0, 35.0, 28.0, 28.0, 18.0, 23.0, 10.0, 15.0, 16.0, 9.0, 11.0, 10.0, 5.0, 6.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.34375, -36.04638671875, -34.7490234375, -33.45166015625, -32.154296875, -30.85693359375, -29.5595703125, -28.26220703125, -26.96484375, -25.66748046875, -24.3701171875, -23.07275390625, -21.775390625, -20.47802734375, -19.1806640625, -17.88330078125, -16.5859375, -15.28857421875, -13.9912109375, -12.69384765625, -11.396484375, -10.09912109375, -8.8017578125, -7.50439453125, -6.20703125, -4.90966796875, -3.6123046875, -2.31494140625, -1.017578125, 0.27978515625, 1.5771484375, 2.87451171875, 4.171875, 5.46923828125, 6.7666015625, 8.06396484375, 9.361328125, 10.65869140625, 11.9560546875, 13.25341796875, 14.55078125, 15.84814453125, 17.1455078125, 18.44287109375, 19.740234375, 21.03759765625, 22.3349609375, 23.63232421875, 24.9296875, 26.22705078125, 27.5244140625, 28.82177734375, 30.119140625, 31.41650390625, 32.7138671875, 34.01123046875, 35.30859375, 36.60595703125, 37.9033203125, 39.20068359375, 40.498046875, 41.79541015625, 43.0927734375, 44.39013671875, 45.6875]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 5.0, 9.0, 5.0, 9.0, 14.0, 14.0, 22.0, 16.0, 29.0, 22.0, 47.0, 83.0, 103.0, 179.0, 376.0, 1167.0, 4473.0, 25157.0, 2948441.0, 149995.0, 11471.0, 2518.0, 724.0, 316.0, 149.0, 94.0, 56.0, 41.0, 40.0, 26.0, 29.0, 19.0, 10.0, 9.0, 8.0, 8.0, 6.0, 1.0, 6.0, 4.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.0, -78.5302734375, -76.060546875, -73.5908203125, -71.12109375, -68.6513671875, -66.181640625, -63.7119140625, -61.2421875, -58.7724609375, -56.302734375, -53.8330078125, -51.36328125, -48.8935546875, -46.423828125, -43.9541015625, -41.484375, -39.0146484375, -36.544921875, -34.0751953125, -31.60546875, -29.1357421875, -26.666015625, -24.1962890625, -21.7265625, -19.2568359375, -16.787109375, -14.3173828125, -11.84765625, -9.3779296875, -6.908203125, -4.4384765625, -1.96875, 0.5009765625, 2.970703125, 5.4404296875, 7.91015625, 10.3798828125, 12.849609375, 15.3193359375, 17.7890625, 20.2587890625, 22.728515625, 25.1982421875, 27.66796875, 30.1376953125, 32.607421875, 35.0771484375, 37.546875, 40.0166015625, 42.486328125, 44.9560546875, 47.42578125, 49.8955078125, 52.365234375, 54.8349609375, 57.3046875, 59.7744140625, 62.244140625, 64.7138671875, 67.18359375, 69.6533203125, 72.123046875, 74.5927734375, 77.0625]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 13.0, 59.0, 187.0, 363.0, 280.0, 71.0, 30.0, 6.0, 0.0, 2.0], "bins": [-248.97499084472656, -244.65927124023438, -240.34356689453125, -236.02784729003906, -231.71212768554688, -227.3964080810547, -223.0806884765625, -218.76498413085938, -214.4492645263672, -210.133544921875, -205.81784057617188, -201.5021209716797, -197.1864013671875, -192.8706817626953, -188.55496215820312, -184.2392578125, -179.9235382080078, -175.60781860351562, -171.2921142578125, -166.9763946533203, -162.66067504882812, -158.34495544433594, -154.02923583984375, -149.71353149414062, -145.39781188964844, -141.08209228515625, -136.76638793945312, -132.45066833496094, -128.13494873046875, -123.81922912597656, -119.5035171508789, -115.18780517578125, -110.87207794189453, -106.55636596679688, -102.24064636230469, -97.9249267578125, -93.60921478271484, -89.29350280761719, -84.977783203125, -80.66206359863281, -76.34635162353516, -72.0306396484375, -67.71492004394531, -63.39920425415039, -59.08348846435547, -54.76777267456055, -50.452056884765625, -46.1363410949707, -41.82062530517578, -37.50490951538086, -33.18919372558594, -28.873477935791016, -24.557762145996094, -20.242046356201172, -15.92633056640625, -11.610614776611328, -7.294897079467773, -2.9791812896728516, 1.3365345001220703, 5.652250289916992, 9.967966079711914, 14.283681869506836, 18.599397659301758, 22.91511344909668, 27.2308292388916]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 5.0, 10.0, 9.0, 10.0, 7.0, 9.0, 19.0, 20.0, 27.0, 21.0, 34.0, 23.0, 26.0, 34.0, 30.0, 26.0, 34.0, 33.0, 34.0, 21.0, 40.0, 46.0, 32.0, 42.0, 37.0, 39.0, 37.0, 42.0, 20.0, 37.0, 20.0, 22.0, 13.0, 25.0, 22.0, 19.0, 19.0, 8.0, 8.0, 7.0, 12.0, 3.0, 4.0, 5.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-95.50756072998047, -92.47132110595703, -89.43508911132812, -86.39884948730469, -83.36260986328125, -80.32637786865234, -77.2901382446289, -74.25390625, -71.21766662597656, -68.18142700195312, -65.14519500732422, -62.10895538330078, -59.07271957397461, -56.03648376464844, -53.000244140625, -49.96400833129883, -46.927772521972656, -43.891536712646484, -40.85530090332031, -37.819061279296875, -34.7828254699707, -31.74658966064453, -28.710351943969727, -25.674114227294922, -22.63787841796875, -19.601642608642578, -16.565404891967773, -13.529168128967285, -10.492931365966797, -7.456694602966309, -4.42045783996582, -1.3842201232910156, 1.6520156860351562, 4.6882524490356445, 7.724489212036133, 10.760725975036621, 13.79696273803711, 16.83319854736328, 19.869436264038086, 22.90567398071289, 25.941909790039062, 28.978145599365234, 32.014381408691406, 35.050621032714844, 38.086856842041016, 41.12309265136719, 44.159332275390625, 47.1955680847168, 50.23180389404297, 53.26803970336914, 56.30427551269531, 59.34051513671875, 62.37675094604492, 65.4129867553711, 68.44922637939453, 71.48545837402344, 74.52169799804688, 77.55793762207031, 80.59416961669922, 83.63040924072266, 86.66664123535156, 89.702880859375, 92.73912048339844, 95.77536010742188, 98.81159210205078]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 6.0, 6.0, 6.0, 10.0, 7.0, 5.0, 15.0, 14.0, 13.0, 17.0, 20.0, 21.0, 23.0, 25.0, 33.0, 36.0, 43.0, 36.0, 44.0, 39.0, 39.0, 50.0, 43.0, 35.0, 47.0, 31.0, 46.0, 28.0, 34.0, 23.0, 26.0, 30.0, 28.0, 19.0, 16.0, 21.0, 12.0, 12.0, 17.0, 5.0, 5.0, 1.0, 4.0, 6.0, 5.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-15.5625, -15.1065673828125, -14.650634765625, -14.1947021484375, -13.73876953125, -13.2828369140625, -12.826904296875, -12.3709716796875, -11.9150390625, -11.4591064453125, -11.003173828125, -10.5472412109375, -10.09130859375, -9.6353759765625, -9.179443359375, -8.7235107421875, -8.267578125, -7.8116455078125, -7.355712890625, -6.8997802734375, -6.44384765625, -5.9879150390625, -5.531982421875, -5.0760498046875, -4.6201171875, -4.1641845703125, -3.708251953125, -3.2523193359375, -2.79638671875, -2.3404541015625, -1.884521484375, -1.4285888671875, -0.97265625, -0.5167236328125, -0.060791015625, 0.3951416015625, 0.85107421875, 1.3070068359375, 1.762939453125, 2.2188720703125, 2.6748046875, 3.1307373046875, 3.586669921875, 4.0426025390625, 4.49853515625, 4.9544677734375, 5.410400390625, 5.8663330078125, 6.322265625, 6.7781982421875, 7.234130859375, 7.6900634765625, 8.14599609375, 8.6019287109375, 9.057861328125, 9.5137939453125, 9.9697265625, 10.4256591796875, 10.881591796875, 11.3375244140625, 11.79345703125, 12.2493896484375, 12.705322265625, 13.1612548828125, 13.6171875]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 4.0, 9.0, 12.0, 11.0, 25.0, 23.0, 56.0, 88.0, 106.0, 184.0, 233.0, 360.0, 572.0, 912.0, 1450.0, 2511.0, 4019.0, 7185.0, 13519.0, 28219.0, 84484.0, 560835.0, 2619622.0, 704915.0, 100268.0, 31359.0, 14406.0, 7567.0, 4508.0, 2574.0, 1593.0, 988.0, 589.0, 365.0, 250.0, 145.0, 102.0, 59.0, 45.0, 32.0, 24.0, 10.0, 10.0, 13.0, 7.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-27.65625, -26.83203125, -26.0078125, -25.18359375, -24.359375, -23.53515625, -22.7109375, -21.88671875, -21.0625, -20.23828125, -19.4140625, -18.58984375, -17.765625, -16.94140625, -16.1171875, -15.29296875, -14.46875, -13.64453125, -12.8203125, -11.99609375, -11.171875, -10.34765625, -9.5234375, -8.69921875, -7.875, -7.05078125, -6.2265625, -5.40234375, -4.578125, -3.75390625, -2.9296875, -2.10546875, -1.28125, -0.45703125, 0.3671875, 1.19140625, 2.015625, 2.83984375, 3.6640625, 4.48828125, 5.3125, 6.13671875, 6.9609375, 7.78515625, 8.609375, 9.43359375, 10.2578125, 11.08203125, 11.90625, 12.73046875, 13.5546875, 14.37890625, 15.203125, 16.02734375, 16.8515625, 17.67578125, 18.5, 19.32421875, 20.1484375, 20.97265625, 21.796875, 22.62109375, 23.4453125, 24.26953125, 25.09375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 11.0, 10.0, 14.0, 10.0, 16.0, 26.0, 46.0, 50.0, 76.0, 124.0, 160.0, 316.0, 633.0, 957.0, 694.0, 372.0, 176.0, 109.0, 80.0, 55.0, 40.0, 20.0, 21.0, 14.0, 19.0, 10.0, 5.0, 7.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.0, -35.98876953125, -34.9775390625, -33.96630859375, -32.955078125, -31.94384765625, -30.9326171875, -29.92138671875, -28.91015625, -27.89892578125, -26.8876953125, -25.87646484375, -24.865234375, -23.85400390625, -22.8427734375, -21.83154296875, -20.8203125, -19.80908203125, -18.7978515625, -17.78662109375, -16.775390625, -15.76416015625, -14.7529296875, -13.74169921875, -12.73046875, -11.71923828125, -10.7080078125, -9.69677734375, -8.685546875, -7.67431640625, -6.6630859375, -5.65185546875, -4.640625, -3.62939453125, -2.6181640625, -1.60693359375, -0.595703125, 0.41552734375, 1.4267578125, 2.43798828125, 3.44921875, 4.46044921875, 5.4716796875, 6.48291015625, 7.494140625, 8.50537109375, 9.5166015625, 10.52783203125, 11.5390625, 12.55029296875, 13.5615234375, 14.57275390625, 15.583984375, 16.59521484375, 17.6064453125, 18.61767578125, 19.62890625, 20.64013671875, 21.6513671875, 22.66259765625, 23.673828125, 24.68505859375, 25.6962890625, 26.70751953125, 27.71875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 5.0, 6.0, 4.0, 13.0, 16.0, 19.0, 19.0, 35.0, 58.0, 103.0, 171.0, 317.0, 790.0, 2730.0, 13124.0, 99106.0, 3537007.0, 497216.0, 35176.0, 5812.0, 1429.0, 522.0, 244.0, 134.0, 91.0, 43.0, 26.0, 20.0, 14.0, 16.0, 8.0, 10.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.4375, -62.9921875, -60.546875, -58.1015625, -55.65625, -53.2109375, -50.765625, -48.3203125, -45.875, -43.4296875, -40.984375, -38.5390625, -36.09375, -33.6484375, -31.203125, -28.7578125, -26.3125, -23.8671875, -21.421875, -18.9765625, -16.53125, -14.0859375, -11.640625, -9.1953125, -6.75, -4.3046875, -1.859375, 0.5859375, 3.03125, 5.4765625, 7.921875, 10.3671875, 12.8125, 15.2578125, 17.703125, 20.1484375, 22.59375, 25.0390625, 27.484375, 29.9296875, 32.375, 34.8203125, 37.265625, 39.7109375, 42.15625, 44.6015625, 47.046875, 49.4921875, 51.9375, 54.3828125, 56.828125, 59.2734375, 61.71875, 64.1640625, 66.609375, 69.0546875, 71.5, 73.9453125, 76.390625, 78.8359375, 81.28125, 83.7265625, 86.171875, 88.6171875, 91.0625]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 7.0, 32.0, 64.0, 168.0, 274.0, 247.0, 149.0, 43.0, 20.0, 8.0, 1.0], "bins": [-459.6931457519531, -451.7401428222656, -443.7871398925781, -435.8341064453125, -427.881103515625, -419.9281005859375, -411.97509765625, -404.0220947265625, -396.0690612792969, -388.1160583496094, -380.1630554199219, -372.21002197265625, -364.25701904296875, -356.30401611328125, -348.35101318359375, -340.39801025390625, -332.44500732421875, -324.49200439453125, -316.53900146484375, -308.5859680175781, -300.6329650878906, -292.6799621582031, -284.7269592285156, -276.7739562988281, -268.8209228515625, -260.867919921875, -252.91490173339844, -244.96189880371094, -237.00888061523438, -229.05587768554688, -221.10287475585938, -213.1498565673828, -205.1968536376953, -197.2438507080078, -189.29083251953125, -181.33782958984375, -173.3848114013672, -165.4318084716797, -157.47879028320312, -149.52578735351562, -141.57278442382812, -133.61978149414062, -125.66676330566406, -117.71376037597656, -109.76074981689453, -101.8077392578125, -93.85472869873047, -85.90171813964844, -77.9487075805664, -69.99569702148438, -62.04269027709961, -54.08967971801758, -46.13667297363281, -38.18366241455078, -30.23065185546875, -22.277645111083984, -14.324634552001953, -6.3716254234313965, 1.5813837051391602, 9.534393310546875, 17.487401962280273, 25.440410614013672, 33.3934211730957, 41.34642791748047, 49.2994384765625]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 9.0, 5.0, 7.0, 6.0, 15.0, 16.0, 8.0, 14.0, 17.0, 12.0, 25.0, 19.0, 20.0, 27.0, 36.0, 27.0, 44.0, 44.0, 36.0, 29.0, 35.0, 35.0, 45.0, 42.0, 37.0, 36.0, 37.0, 39.0, 27.0, 34.0, 36.0, 19.0, 21.0, 24.0, 23.0, 17.0, 10.0, 9.0, 15.0, 11.0, 7.0, 6.0, 4.0, 4.0, 4.0, 6.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.98035430908203, -59.78236389160156, -57.58437728881836, -55.386390686035156, -53.18840026855469, -50.99040985107422, -48.792423248291016, -46.59443664550781, -44.396446228027344, -42.198455810546875, -40.00046920776367, -37.80248260498047, -35.6044921875, -33.40650177001953, -31.208515167236328, -29.010526657104492, -26.812538146972656, -24.61454963684082, -22.416561126708984, -20.21857261657715, -18.020584106445312, -15.822595596313477, -13.62460708618164, -11.426618576049805, -9.228630065917969, -7.030641555786133, -4.832653045654297, -2.634664535522461, -0.436676025390625, 1.761312484741211, 3.959300994873047, 6.157289505004883, 8.355270385742188, 10.553258895874023, 12.75124740600586, 14.949235916137695, 17.14722442626953, 19.345212936401367, 21.543201446533203, 23.74118995666504, 25.939178466796875, 28.13716697692871, 30.335155487060547, 32.53314208984375, 34.73113250732422, 36.92912292480469, 39.12710952758789, 41.325096130371094, 43.52308654785156, 45.72107696533203, 47.919063568115234, 50.11705017089844, 52.315040588378906, 54.513031005859375, 56.71101760864258, 58.90900421142578, 61.10699462890625, 63.30498504638672, 65.50297546386719, 67.70095825195312, 69.8989486694336, 72.09693908691406, 74.294921875, 76.49291229248047, 78.69090270996094]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 8.0, 3.0, 5.0, 10.0, 9.0, 21.0, 19.0, 22.0, 25.0, 39.0, 27.0, 38.0, 41.0, 33.0, 45.0, 50.0, 38.0, 45.0, 46.0, 31.0, 49.0, 44.0, 39.0, 42.0, 44.0, 38.0, 32.0, 18.0, 27.0, 24.0, 24.0, 21.0, 13.0, 6.0, 8.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.890625, -17.357666015625, -16.82470703125, -16.291748046875, -15.7587890625, -15.225830078125, -14.69287109375, -14.159912109375, -13.626953125, -13.093994140625, -12.56103515625, -12.028076171875, -11.4951171875, -10.962158203125, -10.42919921875, -9.896240234375, -9.36328125, -8.830322265625, -8.29736328125, -7.764404296875, -7.2314453125, -6.698486328125, -6.16552734375, -5.632568359375, -5.099609375, -4.566650390625, -4.03369140625, -3.500732421875, -2.9677734375, -2.434814453125, -1.90185546875, -1.368896484375, -0.8359375, -0.302978515625, 0.22998046875, 0.762939453125, 1.2958984375, 1.828857421875, 2.36181640625, 2.894775390625, 3.427734375, 3.960693359375, 4.49365234375, 5.026611328125, 5.5595703125, 6.092529296875, 6.62548828125, 7.158447265625, 7.69140625, 8.224365234375, 8.75732421875, 9.290283203125, 9.8232421875, 10.356201171875, 10.88916015625, 11.422119140625, 11.955078125, 12.488037109375, 13.02099609375, 13.553955078125, 14.0869140625, 14.619873046875, 15.15283203125, 15.685791015625, 16.21875]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 6.0, 11.0, 14.0, 18.0, 30.0, 41.0, 62.0, 115.0, 124.0, 197.0, 306.0, 438.0, 763.0, 1102.0, 1712.0, 2750.0, 4217.0, 6936.0, 11561.0, 19547.0, 32750.0, 55292.0, 94128.0, 163121.0, 242546.0, 169810.0, 98035.0, 57296.0, 33903.0, 20146.0, 11893.0, 7337.0, 4472.0, 2816.0, 1733.0, 1166.0, 754.0, 473.0, 297.0, 202.0, 148.0, 104.0, 63.0, 37.0, 40.0, 17.0, 10.0, 7.0, 6.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.339599609375, -0.3288307189941406, -0.31806182861328125, -0.3072929382324219, -0.2965240478515625, -0.2857551574707031, -0.27498626708984375, -0.2642173767089844, -0.253448486328125, -0.24267959594726562, -0.23191070556640625, -0.22114181518554688, -0.2103729248046875, -0.19960403442382812, -0.18883514404296875, -0.17806625366210938, -0.16729736328125, -0.15652847290039062, -0.14575958251953125, -0.13499069213867188, -0.1242218017578125, -0.11345291137695312, -0.10268402099609375, -0.09191513061523438, -0.081146240234375, -0.07037734985351562, -0.05960845947265625, -0.048839569091796875, -0.0380706787109375, -0.027301788330078125, -0.01653289794921875, -0.005764007568359375, 0.0050048828125, 0.015773773193359375, 0.02654266357421875, 0.037311553955078125, 0.0480804443359375, 0.058849334716796875, 0.06961822509765625, 0.08038711547851562, 0.091156005859375, 0.10192489624023438, 0.11269378662109375, 0.12346267700195312, 0.1342315673828125, 0.14500045776367188, 0.15576934814453125, 0.16653823852539062, 0.17730712890625, 0.18807601928710938, 0.19884490966796875, 0.20961380004882812, 0.2203826904296875, 0.23115158081054688, 0.24192047119140625, 0.2526893615722656, 0.263458251953125, 0.2742271423339844, 0.28499603271484375, 0.2957649230957031, 0.3065338134765625, 0.3173027038574219, 0.32807159423828125, 0.3388404846191406, 0.349609375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 0.0, 3.0, 7.0, 10.0, 11.0, 7.0, 8.0, 17.0, 18.0, 19.0, 18.0, 24.0, 24.0, 30.0, 25.0, 41.0, 41.0, 33.0, 45.0, 48.0, 41.0, 38.0, 1072.0, 37.0, 33.0, 30.0, 36.0, 44.0, 35.0, 39.0, 22.0, 25.0, 13.0, 16.0, 19.0, 18.0, 15.0, 16.0, 13.0, 9.0, 6.0, 6.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.859375, -9.533447265625, -9.20751953125, -8.881591796875, -8.5556640625, -8.229736328125, -7.90380859375, -7.577880859375, -7.251953125, -6.926025390625, -6.60009765625, -6.274169921875, -5.9482421875, -5.622314453125, -5.29638671875, -4.970458984375, -4.64453125, -4.318603515625, -3.99267578125, -3.666748046875, -3.3408203125, -3.014892578125, -2.68896484375, -2.363037109375, -2.037109375, -1.711181640625, -1.38525390625, -1.059326171875, -0.7333984375, -0.407470703125, -0.08154296875, 0.244384765625, 0.5703125, 0.896240234375, 1.22216796875, 1.548095703125, 1.8740234375, 2.199951171875, 2.52587890625, 2.851806640625, 3.177734375, 3.503662109375, 3.82958984375, 4.155517578125, 4.4814453125, 4.807373046875, 5.13330078125, 5.459228515625, 5.78515625, 6.111083984375, 6.43701171875, 6.762939453125, 7.0888671875, 7.414794921875, 7.74072265625, 8.066650390625, 8.392578125, 8.718505859375, 9.04443359375, 9.370361328125, 9.6962890625, 10.022216796875, 10.34814453125, 10.674072265625, 11.0]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 6.0, 5.0, 13.0, 13.0, 21.0, 44.0, 60.0, 77.0, 101.0, 141.0, 238.0, 289.0, 391.0, 609.0, 824.0, 1074.0, 1643.0, 2182.0, 3242.0, 4465.0, 6428.0, 9313.0, 13572.0, 20327.0, 30282.0, 46080.0, 70816.0, 112494.0, 178663.0, 1238250.0, 123815.0, 77883.0, 50114.0, 33284.0, 22322.0, 14934.0, 9996.0, 6986.0, 4788.0, 3273.0, 2278.0, 1626.0, 1162.0, 900.0, 608.0, 423.0, 325.0, 219.0, 165.0, 107.0, 98.0, 52.0, 43.0, 22.0, 20.0, 14.0, 11.0, 5.0, 2.0, 5.0, 2.0, 3.0], "bins": [-0.143310546875, -0.138702392578125, -0.13409423828125, -0.129486083984375, -0.1248779296875, -0.120269775390625, -0.11566162109375, -0.111053466796875, -0.1064453125, -0.101837158203125, -0.09722900390625, -0.092620849609375, -0.0880126953125, -0.083404541015625, -0.07879638671875, -0.074188232421875, -0.069580078125, -0.064971923828125, -0.06036376953125, -0.055755615234375, -0.0511474609375, -0.046539306640625, -0.04193115234375, -0.037322998046875, -0.03271484375, -0.028106689453125, -0.02349853515625, -0.018890380859375, -0.0142822265625, -0.009674072265625, -0.00506591796875, -0.000457763671875, 0.004150390625, 0.008758544921875, 0.01336669921875, 0.017974853515625, 0.0225830078125, 0.027191162109375, 0.03179931640625, 0.036407470703125, 0.041015625, 0.045623779296875, 0.05023193359375, 0.054840087890625, 0.0594482421875, 0.064056396484375, 0.06866455078125, 0.073272705078125, 0.077880859375, 0.082489013671875, 0.08709716796875, 0.091705322265625, 0.0963134765625, 0.100921630859375, 0.10552978515625, 0.110137939453125, 0.11474609375, 0.119354248046875, 0.12396240234375, 0.128570556640625, 0.1331787109375, 0.137786865234375, 0.14239501953125, 0.147003173828125, 0.151611328125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 8.0, 9.0, 4.0, 5.0, 11.0, 17.0, 13.0, 14.0, 13.0, 20.0, 27.0, 34.0, 43.0, 49.0, 50.0, 55.0, 60.0, 70.0, 66.0, 52.0, 66.0, 48.0, 51.0, 35.0, 36.0, 27.0, 25.0, 21.0, 18.0, 6.0, 12.0, 7.0, 7.0, 4.0, 4.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0005297660827636719, -0.0005147233605384827, -0.0004996806383132935, -0.00048463791608810425, -0.00046959519386291504, -0.00045455247163772583, -0.0004395097494125366, -0.0004244670271873474, -0.0004094243049621582, -0.000394381582736969, -0.0003793388605117798, -0.0003642961382865906, -0.00034925341606140137, -0.00033421069383621216, -0.00031916797161102295, -0.00030412524938583374, -0.00028908252716064453, -0.0002740398049354553, -0.0002589970827102661, -0.0002439543604850769, -0.0002289116382598877, -0.00021386891603469849, -0.00019882619380950928, -0.00018378347158432007, -0.00016874074935913086, -0.00015369802713394165, -0.00013865530490875244, -0.00012361258268356323, -0.00010856986045837402, -9.352713823318481e-05, -7.84844160079956e-05, -6.34416937828064e-05, -4.839897155761719e-05, -3.335624933242798e-05, -1.831352710723877e-05, -3.2708048820495605e-06, 1.1771917343139648e-05, 2.6814639568328857e-05, 4.1857361793518066e-05, 5.6900084018707275e-05, 7.194280624389648e-05, 8.69855284690857e-05, 0.0001020282506942749, 0.00011707097291946411, 0.00013211369514465332, 0.00014715641736984253, 0.00016219913959503174, 0.00017724186182022095, 0.00019228458404541016, 0.00020732730627059937, 0.00022237002849578857, 0.00023741275072097778, 0.000252455472946167, 0.0002674981951713562, 0.0002825409173965454, 0.0002975836396217346, 0.00031262636184692383, 0.00032766908407211304, 0.00034271180629730225, 0.00035775452852249146, 0.00037279725074768066, 0.0003878399729728699, 0.0004028826951980591, 0.0004179254174232483, 0.0004329681396484375]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 6.0, 3.0, 3.0, 7.0, 9.0, 13.0, 9.0, 21.0, 27.0, 28.0, 34.0, 61.0, 65.0, 125.0, 209.0, 420.0, 1800.0, 981799.0, 62103.0, 870.0, 349.0, 175.0, 100.0, 77.0, 51.0, 45.0, 26.0, 19.0, 14.0, 16.0, 19.0, 10.0, 8.0, 5.0, 9.0, 7.0, 2.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0097198486328125, -0.00938260555267334, -0.00904536247253418, -0.00870811939239502, -0.00837087631225586, -0.0080336332321167, -0.007696390151977539, -0.007359147071838379, -0.007021903991699219, -0.006684660911560059, -0.0063474178314208984, -0.006010174751281738, -0.005672931671142578, -0.005335688591003418, -0.004998445510864258, -0.004661202430725098, -0.0043239593505859375, -0.003986716270446777, -0.003649473190307617, -0.003312230110168457, -0.002974987030029297, -0.0026377439498901367, -0.0023005008697509766, -0.0019632577896118164, -0.0016260147094726562, -0.001288771629333496, -0.0009515285491943359, -0.0006142854690551758, -0.0002770423889160156, 6.020069122314453e-05, 0.0003974437713623047, 0.0007346868515014648, 0.001071929931640625, 0.0014091730117797852, 0.0017464160919189453, 0.0020836591720581055, 0.0024209022521972656, 0.0027581453323364258, 0.003095388412475586, 0.003432631492614746, 0.0037698745727539062, 0.004107117652893066, 0.0044443607330322266, 0.004781603813171387, 0.005118846893310547, 0.005456089973449707, 0.005793333053588867, 0.006130576133728027, 0.0064678192138671875, 0.006805062294006348, 0.007142305374145508, 0.007479548454284668, 0.007816791534423828, 0.008154034614562988, 0.008491277694702148, 0.008828520774841309, 0.009165763854980469, 0.009503006935119629, 0.009840250015258789, 0.01017749309539795, 0.01051473617553711, 0.01085197925567627, 0.01118922233581543, 0.01152646541595459, 0.01186370849609375]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 8.0, 912.0, 88.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0028254054486751556, -0.0027009393088519573, -0.0025764729361981153, -0.002452006796374917, -0.0023275406565517187, -0.0022030742838978767, -0.0020786081440746784, -0.00195414200425148, -0.00182967574801296, -0.0017052094917744398, -0.0015807433519512415, -0.0014562770957127213, -0.0013318108394742012, -0.0012073446996510029, -0.0010828784434124827, -0.0009584122453816235, -0.0008339460473507643, -0.000709479849319905, -0.0005850136512890458, -0.00046054739505052567, -0.00033608119701966643, -0.0002116149989888072, -8.714874275028706e-05, 3.7317455280572176e-05, 0.0001617836533114314, 0.00028624985134229064, 0.00041071607847698033, 0.00053518230561167, 0.0006596485036425292, 0.0007841147016733885, 0.0009085809579119086, 0.0010330472141504288, 0.001157513353973627, 0.0012819796102121472, 0.0014064457500353456, 0.0015309120062738657, 0.001655378146097064, 0.0017798444023355842, 0.0019043106585741043, 0.0020287767983973026, 0.002153242938220501, 0.0022777090780436993, 0.0024021754506975412, 0.0025266415905207396, 0.002651107730343938, 0.00277557410299778, 0.002900040242820978, 0.0030245063826441765, 0.0031489727552980185, 0.0032734388951212168, 0.0033979052677750587, 0.003522371407598257, 0.0036468375474214554, 0.0037713036872446537, 0.0038957700598984957, 0.004020236432552338, 0.004144702572375536, 0.004269168712198734, 0.004393634852021933, 0.004518100991845131, 0.0046425675973296165, 0.004767033737152815, 0.004891499876976013, 0.0050159660167992115, 0.00514043215662241]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 8.0, 25.0, 27.0, 47.0, 45.0, 91.0, 110.0, 95.0, 119.0, 111.0, 108.0, 58.0, 72.0, 36.0, 25.0, 16.0, 9.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000614464282989502, -0.0005881385877728462, -0.0005618128925561905, -0.0005354871973395348, -0.000509161502122879, -0.0004828358069062233, -0.00045651011168956757, -0.00043018441647291183, -0.0004038587212562561, -0.00037753302603960037, -0.00035120733082294464, -0.0003248816356062889, -0.0002985559403896332, -0.00027223024517297745, -0.0002459045499563217, -0.00021957885473966599, -0.00019325315952301025, -0.00016692746430635452, -0.0001406017690896988, -0.00011427607387304306, -8.795037865638733e-05, -6.16246834397316e-05, -3.529898822307587e-05, -8.973293006420135e-06, 1.7352402210235596e-05, 4.367809742689133e-05, 7.000379264354706e-05, 9.632948786020279e-05, 0.00012265518307685852, 0.00014898087829351425, 0.00017530657351016998, 0.00020163226872682571, 0.00022795796394348145, 0.0002542836591601372, 0.0002806093543767929, 0.00030693504959344864, 0.00033326074481010437, 0.0003595864400267601, 0.00038591213524341583, 0.00041223783046007156, 0.0004385635256767273, 0.000464889220893383, 0.0004912149161100388, 0.0005175406113266945, 0.0005438663065433502, 0.000570192001760006, 0.0005965176969766617, 0.0006228433921933174, 0.0006491690874099731, 0.0006754947826266289, 0.0007018204778432846, 0.0007281461730599403, 0.0007544718682765961, 0.0007807975634932518, 0.0008071232587099075, 0.0008334489539265633, 0.000859774649143219, 0.0008861003443598747, 0.0009124260395765305, 0.0009387517347931862, 0.0009650774300098419, 0.0009914031252264977, 0.0010177288204431534, 0.0010440545156598091, 0.0010703802108764648]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 8.0, 3.0, 5.0, 10.0, 9.0, 21.0, 19.0, 22.0, 25.0, 39.0, 27.0, 38.0, 41.0, 33.0, 45.0, 50.0, 38.0, 45.0, 46.0, 31.0, 49.0, 44.0, 39.0, 42.0, 44.0, 38.0, 32.0, 18.0, 27.0, 24.0, 24.0, 21.0, 13.0, 6.0, 8.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.890625, -17.357666015625, -16.82470703125, -16.291748046875, -15.7587890625, -15.225830078125, -14.69287109375, -14.159912109375, -13.626953125, -13.093994140625, -12.56103515625, -12.028076171875, -11.4951171875, -10.962158203125, -10.42919921875, -9.896240234375, -9.36328125, -8.830322265625, -8.29736328125, -7.764404296875, -7.2314453125, -6.698486328125, -6.16552734375, -5.632568359375, -5.099609375, -4.566650390625, -4.03369140625, -3.500732421875, -2.9677734375, -2.434814453125, -1.90185546875, -1.368896484375, -0.8359375, -0.302978515625, 0.22998046875, 0.762939453125, 1.2958984375, 1.828857421875, 2.36181640625, 2.894775390625, 3.427734375, 3.960693359375, 4.49365234375, 5.026611328125, 5.5595703125, 6.092529296875, 6.62548828125, 7.158447265625, 7.69140625, 8.224365234375, 8.75732421875, 9.290283203125, 9.8232421875, 10.356201171875, 10.88916015625, 11.422119140625, 11.955078125, 12.488037109375, 13.02099609375, 13.553955078125, 14.0869140625, 14.619873046875, 15.15283203125, 15.685791015625, 16.21875]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 6.0, 7.0, 10.0, 26.0, 26.0, 39.0, 60.0, 87.0, 112.0, 183.0, 286.0, 442.0, 713.0, 1110.0, 1725.0, 2808.0, 4499.0, 7322.0, 12758.0, 22015.0, 39626.0, 77505.0, 212852.0, 411952.0, 123761.0, 55892.0, 30201.0, 16921.0, 9912.0, 5858.0, 3646.0, 2276.0, 1395.0, 858.0, 539.0, 381.0, 256.0, 147.0, 110.0, 87.0, 44.0, 29.0, 26.0, 12.0, 16.0, 7.0, 4.0, 1.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.6875, -18.049072265625, -17.41064453125, -16.772216796875, -16.1337890625, -15.495361328125, -14.85693359375, -14.218505859375, -13.580078125, -12.941650390625, -12.30322265625, -11.664794921875, -11.0263671875, -10.387939453125, -9.74951171875, -9.111083984375, -8.47265625, -7.834228515625, -7.19580078125, -6.557373046875, -5.9189453125, -5.280517578125, -4.64208984375, -4.003662109375, -3.365234375, -2.726806640625, -2.08837890625, -1.449951171875, -0.8115234375, -0.173095703125, 0.46533203125, 1.103759765625, 1.7421875, 2.380615234375, 3.01904296875, 3.657470703125, 4.2958984375, 4.934326171875, 5.57275390625, 6.211181640625, 6.849609375, 7.488037109375, 8.12646484375, 8.764892578125, 9.4033203125, 10.041748046875, 10.68017578125, 11.318603515625, 11.95703125, 12.595458984375, 13.23388671875, 13.872314453125, 14.5107421875, 15.149169921875, 15.78759765625, 16.426025390625, 17.064453125, 17.702880859375, 18.34130859375, 18.979736328125, 19.6181640625, 20.256591796875, 20.89501953125, 21.533447265625, 22.171875]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 7.0, 3.0, 14.0, 4.0, 9.0, 6.0, 8.0, 11.0, 11.0, 17.0, 20.0, 23.0, 29.0, 28.0, 38.0, 25.0, 30.0, 44.0, 50.0, 90.0, 110.0, 225.0, 1526.0, 184.0, 95.0, 70.0, 41.0, 42.0, 42.0, 36.0, 33.0, 24.0, 23.0, 16.0, 23.0, 22.0, 22.0, 11.0, 8.0, 10.0, 8.0, 9.0, 0.0, 4.0, 2.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.53125, -37.34033203125, -36.1494140625, -34.95849609375, -33.767578125, -32.57666015625, -31.3857421875, -30.19482421875, -29.00390625, -27.81298828125, -26.6220703125, -25.43115234375, -24.240234375, -23.04931640625, -21.8583984375, -20.66748046875, -19.4765625, -18.28564453125, -17.0947265625, -15.90380859375, -14.712890625, -13.52197265625, -12.3310546875, -11.14013671875, -9.94921875, -8.75830078125, -7.5673828125, -6.37646484375, -5.185546875, -3.99462890625, -2.8037109375, -1.61279296875, -0.421875, 0.76904296875, 1.9599609375, 3.15087890625, 4.341796875, 5.53271484375, 6.7236328125, 7.91455078125, 9.10546875, 10.29638671875, 11.4873046875, 12.67822265625, 13.869140625, 15.06005859375, 16.2509765625, 17.44189453125, 18.6328125, 19.82373046875, 21.0146484375, 22.20556640625, 23.396484375, 24.58740234375, 25.7783203125, 26.96923828125, 28.16015625, 29.35107421875, 30.5419921875, 31.73291015625, 32.923828125, 34.11474609375, 35.3056640625, 36.49658203125, 37.6875]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 9.0, 6.0, 7.0, 7.0, 13.0, 14.0, 21.0, 35.0, 47.0, 50.0, 92.0, 114.0, 199.0, 436.0, 932.0, 2114.0, 5822.0, 17492.0, 64994.0, 479842.0, 2391760.0, 135233.0, 30905.0, 9548.0, 3353.0, 1312.0, 604.0, 268.0, 157.0, 100.0, 57.0, 40.0, 34.0, 21.0, 22.0, 7.0, 15.0, 11.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-46.0625, -44.716796875, -43.37109375, -42.025390625, -40.6796875, -39.333984375, -37.98828125, -36.642578125, -35.296875, -33.951171875, -32.60546875, -31.259765625, -29.9140625, -28.568359375, -27.22265625, -25.876953125, -24.53125, -23.185546875, -21.83984375, -20.494140625, -19.1484375, -17.802734375, -16.45703125, -15.111328125, -13.765625, -12.419921875, -11.07421875, -9.728515625, -8.3828125, -7.037109375, -5.69140625, -4.345703125, -3.0, -1.654296875, -0.30859375, 1.037109375, 2.3828125, 3.728515625, 5.07421875, 6.419921875, 7.765625, 9.111328125, 10.45703125, 11.802734375, 13.1484375, 14.494140625, 15.83984375, 17.185546875, 18.53125, 19.876953125, 21.22265625, 22.568359375, 23.9140625, 25.259765625, 26.60546875, 27.951171875, 29.296875, 30.642578125, 31.98828125, 33.333984375, 34.6796875, 36.025390625, 37.37109375, 38.716796875, 40.0625]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 10.0, 37.0, 117.0, 233.0, 297.0, 210.0, 69.0, 29.0, 7.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.21734619140625, -40.668174743652344, -35.11900329589844, -29.569833755493164, -24.020662307739258, -18.47149085998535, -12.922321319580078, -7.373149871826172, -1.8239784240722656, 3.7251925468444824, 9.27436351776123, 14.82353401184082, 20.372705459594727, 25.921876907348633, 31.471046447753906, 37.02021789550781, 42.56938934326172, 48.118560791015625, 53.66773223876953, 59.21690368652344, 64.76607513427734, 70.31524658203125, 75.86441040039062, 81.41358947753906, 86.96275329589844, 92.51192474365234, 98.06109619140625, 103.61026763916016, 109.15943908691406, 114.70861053466797, 120.25778198242188, 125.80694580078125, 131.3561248779297, 136.90528869628906, 142.4544677734375, 148.00363159179688, 153.5528106689453, 159.1019744873047, 164.65115356445312, 170.2003173828125, 175.74949645996094, 181.2986602783203, 186.84783935546875, 192.39700317382812, 197.94618225097656, 203.49534606933594, 209.04452514648438, 214.59368896484375, 220.14285278320312, 225.6920166015625, 231.24119567871094, 236.7903594970703, 242.33953857421875, 247.88870239257812, 253.43788146972656, 258.987060546875, 264.5362243652344, 270.08538818359375, 275.6345520019531, 281.1837463378906, 286.73291015625, 292.2820739746094, 297.83123779296875, 303.38043212890625, 308.9295959472656]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 8.0, 9.0, 4.0, 13.0, 11.0, 13.0, 14.0, 20.0, 19.0, 21.0, 20.0, 26.0, 27.0, 36.0, 26.0, 28.0, 41.0, 42.0, 39.0, 40.0, 39.0, 40.0, 38.0, 40.0, 44.0, 39.0, 37.0, 39.0, 34.0, 27.0, 25.0, 19.0, 13.0, 23.0, 12.0, 11.0, 10.0, 9.0, 13.0, 6.0, 7.0, 6.0, 4.0, 5.0, 6.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-83.2530746459961, -80.60598754882812, -77.95890045166016, -75.31180572509766, -72.66471862792969, -70.01763153076172, -67.37054443359375, -64.72345733642578, -62.07636642456055, -59.42927932739258, -56.782188415527344, -54.135101318359375, -51.488014221191406, -48.84092330932617, -46.1938362121582, -43.54674530029297, -40.899658203125, -38.25257110595703, -35.6054801940918, -32.95839309692383, -30.311304092407227, -27.664215087890625, -25.017127990722656, -22.370038986206055, -19.722949981689453, -17.07586097717285, -14.428772926330566, -11.781684875488281, -9.13459587097168, -6.487506866455078, -3.840418815612793, -1.1933307647705078, 1.4537506103515625, 4.100839138031006, 6.747927665710449, 9.395015716552734, 12.042104721069336, 14.689193725585938, 17.336280822753906, 19.983369827270508, 22.63045883178711, 25.27754783630371, 27.924636840820312, 30.57172393798828, 33.21881103515625, 35.865901947021484, 38.51298904418945, 41.16007995605469, 43.807167053222656, 46.454254150390625, 49.10134506225586, 51.74843215942383, 54.39552307128906, 57.04261016845703, 59.689697265625, 62.33678436279297, 64.98387145996094, 67.6309585571289, 70.27804565429688, 72.92514038085938, 75.57222747802734, 78.21931457519531, 80.86640167236328, 83.51348876953125, 86.16058349609375]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 7.0, 3.0, 7.0, 7.0, 9.0, 17.0, 15.0, 19.0, 23.0, 26.0, 38.0, 35.0, 34.0, 42.0, 48.0, 28.0, 48.0, 31.0, 46.0, 46.0, 42.0, 38.0, 41.0, 40.0, 34.0, 41.0, 25.0, 34.0, 37.0, 21.0, 22.0, 18.0, 18.0, 18.0, 12.0, 7.0, 7.0, 3.0, 2.0, 4.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-17.46875, -16.945068359375, -16.42138671875, -15.897705078125, -15.3740234375, -14.850341796875, -14.32666015625, -13.802978515625, -13.279296875, -12.755615234375, -12.23193359375, -11.708251953125, -11.1845703125, -10.660888671875, -10.13720703125, -9.613525390625, -9.08984375, -8.566162109375, -8.04248046875, -7.518798828125, -6.9951171875, -6.471435546875, -5.94775390625, -5.424072265625, -4.900390625, -4.376708984375, -3.85302734375, -3.329345703125, -2.8056640625, -2.281982421875, -1.75830078125, -1.234619140625, -0.7109375, -0.187255859375, 0.33642578125, 0.860107421875, 1.3837890625, 1.907470703125, 2.43115234375, 2.954833984375, 3.478515625, 4.002197265625, 4.52587890625, 5.049560546875, 5.5732421875, 6.096923828125, 6.62060546875, 7.144287109375, 7.66796875, 8.191650390625, 8.71533203125, 9.239013671875, 9.7626953125, 10.286376953125, 10.81005859375, 11.333740234375, 11.857421875, 12.381103515625, 12.90478515625, 13.428466796875, 13.9521484375, 14.475830078125, 14.99951171875, 15.523193359375, 16.046875]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 4.0, 7.0, 3.0, 6.0, 16.0, 14.0, 15.0, 31.0, 34.0, 52.0, 85.0, 94.0, 152.0, 227.0, 280.0, 475.0, 666.0, 974.0, 1382.0, 2244.0, 3529.0, 5793.0, 9683.0, 18152.0, 41369.0, 158389.0, 1085371.0, 2332195.0, 399417.0, 73431.0, 26566.0, 12915.0, 7614.0, 4514.0, 2865.0, 1859.0, 1236.0, 837.0, 584.0, 374.0, 261.0, 204.0, 98.0, 85.0, 59.0, 33.0, 25.0, 16.0, 21.0, 6.0, 11.0, 5.0, 9.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.75, -22.96484375, -22.1796875, -21.39453125, -20.609375, -19.82421875, -19.0390625, -18.25390625, -17.46875, -16.68359375, -15.8984375, -15.11328125, -14.328125, -13.54296875, -12.7578125, -11.97265625, -11.1875, -10.40234375, -9.6171875, -8.83203125, -8.046875, -7.26171875, -6.4765625, -5.69140625, -4.90625, -4.12109375, -3.3359375, -2.55078125, -1.765625, -0.98046875, -0.1953125, 0.58984375, 1.375, 2.16015625, 2.9453125, 3.73046875, 4.515625, 5.30078125, 6.0859375, 6.87109375, 7.65625, 8.44140625, 9.2265625, 10.01171875, 10.796875, 11.58203125, 12.3671875, 13.15234375, 13.9375, 14.72265625, 15.5078125, 16.29296875, 17.078125, 17.86328125, 18.6484375, 19.43359375, 20.21875, 21.00390625, 21.7890625, 22.57421875, 23.359375, 24.14453125, 24.9296875, 25.71484375, 26.5]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 7.0, 6.0, 5.0, 11.0, 12.0, 11.0, 18.0, 16.0, 19.0, 29.0, 37.0, 45.0, 52.0, 71.0, 93.0, 158.0, 238.0, 476.0, 724.0, 734.0, 485.0, 273.0, 161.0, 97.0, 58.0, 43.0, 41.0, 29.0, 31.0, 14.0, 16.0, 8.0, 13.0, 6.0, 6.0, 5.0, 3.0, 6.0, 4.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.59375, -26.8056640625, -26.017578125, -25.2294921875, -24.44140625, -23.6533203125, -22.865234375, -22.0771484375, -21.2890625, -20.5009765625, -19.712890625, -18.9248046875, -18.13671875, -17.3486328125, -16.560546875, -15.7724609375, -14.984375, -14.1962890625, -13.408203125, -12.6201171875, -11.83203125, -11.0439453125, -10.255859375, -9.4677734375, -8.6796875, -7.8916015625, -7.103515625, -6.3154296875, -5.52734375, -4.7392578125, -3.951171875, -3.1630859375, -2.375, -1.5869140625, -0.798828125, -0.0107421875, 0.77734375, 1.5654296875, 2.353515625, 3.1416015625, 3.9296875, 4.7177734375, 5.505859375, 6.2939453125, 7.08203125, 7.8701171875, 8.658203125, 9.4462890625, 10.234375, 11.0224609375, 11.810546875, 12.5986328125, 13.38671875, 14.1748046875, 14.962890625, 15.7509765625, 16.5390625, 17.3271484375, 18.115234375, 18.9033203125, 19.69140625, 20.4794921875, 21.267578125, 22.0556640625, 22.84375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 6.0, 1.0, 8.0, 12.0, 20.0, 19.0, 35.0, 54.0, 79.0, 98.0, 193.0, 336.0, 635.0, 1264.0, 2925.0, 6538.0, 16146.0, 47167.0, 193817.0, 2996149.0, 786148.0, 95417.0, 28165.0, 10486.0, 4446.0, 1969.0, 918.0, 500.0, 275.0, 141.0, 99.0, 65.0, 35.0, 35.0, 20.0, 13.0, 14.0, 9.0, 5.0, 7.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-48.125, -46.7412109375, -45.357421875, -43.9736328125, -42.58984375, -41.2060546875, -39.822265625, -38.4384765625, -37.0546875, -35.6708984375, -34.287109375, -32.9033203125, -31.51953125, -30.1357421875, -28.751953125, -27.3681640625, -25.984375, -24.6005859375, -23.216796875, -21.8330078125, -20.44921875, -19.0654296875, -17.681640625, -16.2978515625, -14.9140625, -13.5302734375, -12.146484375, -10.7626953125, -9.37890625, -7.9951171875, -6.611328125, -5.2275390625, -3.84375, -2.4599609375, -1.076171875, 0.3076171875, 1.69140625, 3.0751953125, 4.458984375, 5.8427734375, 7.2265625, 8.6103515625, 9.994140625, 11.3779296875, 12.76171875, 14.1455078125, 15.529296875, 16.9130859375, 18.296875, 19.6806640625, 21.064453125, 22.4482421875, 23.83203125, 25.2158203125, 26.599609375, 27.9833984375, 29.3671875, 30.7509765625, 32.134765625, 33.5185546875, 34.90234375, 36.2861328125, 37.669921875, 39.0537109375, 40.4375]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 46.0, 220.0, 510.0, 196.0, 34.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-211.16114807128906, -196.59690856933594, -182.0326690673828, -167.4684295654297, -152.90419006347656, -138.33995056152344, -123.77571105957031, -109.21147155761719, -94.64723205566406, -80.08299255371094, -65.51875305175781, -50.95451354980469, -36.39027404785156, -21.826034545898438, -7.2617950439453125, 7.3024444580078125, 21.866683959960938, 36.43092346191406, 50.99516296386719, 65.55940246582031, 80.12364196777344, 94.68788146972656, 109.25212097167969, 123.81636047363281, 138.38059997558594, 152.94483947753906, 167.5090789794922, 182.0733184814453, 196.63755798339844, 211.20179748535156, 225.7660369873047, 240.3302764892578, 254.89453125, 269.4587707519531, 284.02301025390625, 298.5872497558594, 313.1514892578125, 327.7157287597656, 342.27996826171875, 356.8442077636719, 371.408447265625, 385.9726867675781, 400.53692626953125, 415.1011657714844, 429.6654052734375, 444.2296447753906, 458.79388427734375, 473.3581237792969, 487.92236328125, 502.4866027832031, 517.0508422851562, 531.6151123046875, 546.1793212890625, 560.7435302734375, 575.3078002929688, 589.8720703125, 604.436279296875, 619.00048828125, 633.5647583007812, 648.1290283203125, 662.6932373046875, 677.2574462890625, 691.8217163085938, 706.385986328125, 720.9501953125]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 5.0, 4.0, 3.0, 6.0, 10.0, 9.0, 9.0, 19.0, 25.0, 16.0, 17.0, 22.0, 32.0, 30.0, 38.0, 32.0, 38.0, 38.0, 36.0, 33.0, 51.0, 45.0, 54.0, 55.0, 34.0, 32.0, 28.0, 26.0, 30.0, 29.0, 37.0, 29.0, 25.0, 19.0, 17.0, 15.0, 4.0, 6.0, 12.0, 8.0, 4.0, 5.0, 6.0, 1.0, 3.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-72.73143005371094, -70.1810302734375, -67.6306381225586, -65.08023834228516, -62.52984619140625, -59.97944641113281, -57.42905044555664, -54.87865447998047, -52.3282585144043, -49.777862548828125, -47.22746658325195, -44.67707061767578, -42.126670837402344, -39.57627868652344, -37.02587890625, -34.47548294067383, -31.925086975097656, -29.374691009521484, -26.824295043945312, -24.273897171020508, -21.723501205444336, -19.173105239868164, -16.62270736694336, -14.072311401367188, -11.521915435791016, -8.971519470214844, -6.4211225509643555, -3.8707261085510254, -1.3203296661376953, 1.2300662994384766, 3.780463218688965, 6.330860137939453, 8.881248474121094, 11.431644439697266, 13.982041358947754, 16.532438278198242, 19.082834243774414, 21.633230209350586, 24.18362808227539, 26.734024047851562, 29.284420013427734, 31.834815979003906, 34.38521194458008, 36.93560791015625, 39.48600769042969, 42.036399841308594, 44.58679962158203, 47.1371955871582, 49.687591552734375, 52.23798751831055, 54.78838348388672, 57.33877944946289, 59.88917541503906, 62.4395751953125, 64.9899673461914, 67.54036712646484, 70.09075927734375, 72.64115905761719, 75.1915512084961, 77.74195098876953, 80.29234313964844, 82.84274291992188, 85.39313507080078, 87.94353485107422, 90.49393463134766]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 3.0, 5.0, 8.0, 9.0, 12.0, 17.0, 25.0, 16.0, 18.0, 25.0, 32.0, 33.0, 37.0, 30.0, 37.0, 31.0, 41.0, 44.0, 45.0, 48.0, 38.0, 33.0, 48.0, 44.0, 48.0, 37.0, 34.0, 25.0, 31.0, 37.0, 21.0, 19.0, 14.0, 11.0, 10.0, 10.0, 10.0, 3.0, 3.0, 7.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.921875, -16.368896484375, -15.81591796875, -15.262939453125, -14.7099609375, -14.156982421875, -13.60400390625, -13.051025390625, -12.498046875, -11.945068359375, -11.39208984375, -10.839111328125, -10.2861328125, -9.733154296875, -9.18017578125, -8.627197265625, -8.07421875, -7.521240234375, -6.96826171875, -6.415283203125, -5.8623046875, -5.309326171875, -4.75634765625, -4.203369140625, -3.650390625, -3.097412109375, -2.54443359375, -1.991455078125, -1.4384765625, -0.885498046875, -0.33251953125, 0.220458984375, 0.7734375, 1.326416015625, 1.87939453125, 2.432373046875, 2.9853515625, 3.538330078125, 4.09130859375, 4.644287109375, 5.197265625, 5.750244140625, 6.30322265625, 6.856201171875, 7.4091796875, 7.962158203125, 8.51513671875, 9.068115234375, 9.62109375, 10.174072265625, 10.72705078125, 11.280029296875, 11.8330078125, 12.385986328125, 12.93896484375, 13.491943359375, 14.044921875, 14.597900390625, 15.15087890625, 15.703857421875, 16.2568359375, 16.809814453125, 17.36279296875, 17.915771484375, 18.46875]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 4.0, 7.0, 21.0, 29.0, 39.0, 74.0, 100.0, 149.0, 211.0, 340.0, 492.0, 771.0, 1154.0, 1817.0, 2835.0, 4372.0, 6932.0, 11198.0, 17951.0, 29288.0, 47068.0, 76274.0, 123972.0, 214771.0, 201477.0, 117173.0, 71960.0, 44676.0, 27318.0, 17029.0, 10563.0, 6684.0, 4183.0, 2715.0, 1728.0, 1104.0, 712.0, 503.0, 291.0, 178.0, 154.0, 78.0, 42.0, 33.0, 27.0, 17.0, 9.0, 14.0, 4.0, 4.0, 7.0, 2.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.331787109375, -0.3213996887207031, -0.31101226806640625, -0.3006248474121094, -0.2902374267578125, -0.2798500061035156, -0.26946258544921875, -0.2590751647949219, -0.248687744140625, -0.23830032348632812, -0.22791290283203125, -0.21752548217773438, -0.2071380615234375, -0.19675064086914062, -0.18636322021484375, -0.17597579956054688, -0.16558837890625, -0.15520095825195312, -0.14481353759765625, -0.13442611694335938, -0.1240386962890625, -0.11365127563476562, -0.10326385498046875, -0.09287643432617188, -0.082489013671875, -0.07210159301757812, -0.06171417236328125, -0.051326751708984375, -0.0409393310546875, -0.030551910400390625, -0.02016448974609375, -0.009777069091796875, 0.0006103515625, 0.010997772216796875, 0.02138519287109375, 0.031772613525390625, 0.0421600341796875, 0.052547454833984375, 0.06293487548828125, 0.07332229614257812, 0.083709716796875, 0.09409713745117188, 0.10448455810546875, 0.11487197875976562, 0.1252593994140625, 0.13564682006835938, 0.14603424072265625, 0.15642166137695312, 0.16680908203125, 0.17719650268554688, 0.18758392333984375, 0.19797134399414062, 0.2083587646484375, 0.21874618530273438, 0.22913360595703125, 0.23952102661132812, 0.249908447265625, 0.2602958679199219, 0.27068328857421875, 0.2810707092285156, 0.2914581298828125, 0.3018455505371094, 0.31223297119140625, 0.3226203918457031, 0.3330078125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 4.0, 10.0, 15.0, 10.0, 12.0, 17.0, 12.0, 19.0, 28.0, 24.0, 25.0, 33.0, 31.0, 39.0, 36.0, 40.0, 31.0, 46.0, 40.0, 1081.0, 39.0, 37.0, 45.0, 34.0, 26.0, 44.0, 35.0, 18.0, 32.0, 24.0, 28.0, 19.0, 16.0, 16.0, 10.0, 7.0, 8.0, 8.0, 7.0, 3.0, 6.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.625, -11.2523193359375, -10.879638671875, -10.5069580078125, -10.13427734375, -9.7615966796875, -9.388916015625, -9.0162353515625, -8.6435546875, -8.2708740234375, -7.898193359375, -7.5255126953125, -7.15283203125, -6.7801513671875, -6.407470703125, -6.0347900390625, -5.662109375, -5.2894287109375, -4.916748046875, -4.5440673828125, -4.17138671875, -3.7987060546875, -3.426025390625, -3.0533447265625, -2.6806640625, -2.3079833984375, -1.935302734375, -1.5626220703125, -1.18994140625, -0.8172607421875, -0.444580078125, -0.0718994140625, 0.30078125, 0.6734619140625, 1.046142578125, 1.4188232421875, 1.79150390625, 2.1641845703125, 2.536865234375, 2.9095458984375, 3.2822265625, 3.6549072265625, 4.027587890625, 4.4002685546875, 4.77294921875, 5.1456298828125, 5.518310546875, 5.8909912109375, 6.263671875, 6.6363525390625, 7.009033203125, 7.3817138671875, 7.75439453125, 8.1270751953125, 8.499755859375, 8.8724365234375, 9.2451171875, 9.6177978515625, 9.990478515625, 10.3631591796875, 10.73583984375, 11.1085205078125, 11.481201171875, 11.8538818359375, 12.2265625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 9.0, 10.0, 20.0, 27.0, 34.0, 35.0, 77.0, 93.0, 161.0, 244.0, 315.0, 476.0, 749.0, 1088.0, 1545.0, 2277.0, 3284.0, 4856.0, 7444.0, 11406.0, 17423.0, 27365.0, 44119.0, 71367.0, 119476.0, 257228.0, 1206894.0, 121969.0, 71938.0, 44924.0, 28021.0, 17832.0, 11426.0, 7538.0, 4988.0, 3250.0, 2252.0, 1566.0, 1068.0, 752.0, 504.0, 349.0, 246.0, 165.0, 120.0, 72.0, 47.0, 34.0, 20.0, 9.0, 9.0, 7.0, 4.0, 4.0, 2.0, 2.0, 3.0], "bins": [-0.192138671875, -0.18631935119628906, -0.18050003051757812, -0.1746807098388672, -0.16886138916015625, -0.1630420684814453, -0.15722274780273438, -0.15140342712402344, -0.1455841064453125, -0.13976478576660156, -0.13394546508789062, -0.1281261444091797, -0.12230682373046875, -0.11648750305175781, -0.11066818237304688, -0.10484886169433594, -0.099029541015625, -0.09321022033691406, -0.08739089965820312, -0.08157157897949219, -0.07575225830078125, -0.06993293762207031, -0.06411361694335938, -0.05829429626464844, -0.0524749755859375, -0.04665565490722656, -0.040836334228515625, -0.03501701354980469, -0.02919769287109375, -0.023378372192382812, -0.017559051513671875, -0.011739730834960938, -0.00592041015625, -0.0001010894775390625, 0.005718231201171875, 0.011537551879882812, 0.01735687255859375, 0.023176193237304688, 0.028995513916015625, 0.03481483459472656, 0.0406341552734375, 0.04645347595214844, 0.052272796630859375, 0.05809211730957031, 0.06391143798828125, 0.06973075866699219, 0.07555007934570312, 0.08136940002441406, 0.087188720703125, 0.09300804138183594, 0.09882736206054688, 0.10464668273925781, 0.11046600341796875, 0.11628532409667969, 0.12210464477539062, 0.12792396545410156, 0.1337432861328125, 0.13956260681152344, 0.14538192749023438, 0.1512012481689453, 0.15702056884765625, 0.1628398895263672, 0.16865921020507812, 0.17447853088378906, 0.1802978515625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 4.0, 3.0, 1.0, 3.0, 9.0, 10.0, 7.0, 3.0, 4.0, 11.0, 18.0, 16.0, 22.0, 23.0, 29.0, 20.0, 28.0, 40.0, 43.0, 39.0, 66.0, 102.0, 111.0, 67.0, 55.0, 35.0, 42.0, 31.0, 20.0, 29.0, 16.0, 14.0, 13.0, 11.0, 12.0, 9.0, 9.0, 6.0, 8.0, 6.0, 4.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004000663757324219, -0.0003871992230415344, -0.00037433207035064697, -0.0003614649176597595, -0.00034859776496887207, -0.0003357306122779846, -0.00032286345958709717, -0.0003099963068962097, -0.00029712915420532227, -0.0002842620015144348, -0.00027139484882354736, -0.0002585276961326599, -0.00024566054344177246, -0.000232793390750885, -0.00021992623805999756, -0.0002070590853691101, -0.00019419193267822266, -0.0001813247799873352, -0.00016845762729644775, -0.0001555904746055603, -0.00014272332191467285, -0.0001298561692237854, -0.00011698901653289795, -0.0001041218638420105, -9.125471115112305e-05, -7.83875584602356e-05, -6.552040576934814e-05, -5.265325307846069e-05, -3.978610038757324e-05, -2.691894769668579e-05, -1.405179500579834e-05, -1.1846423149108887e-06, 1.1682510375976562e-05, 2.4549663066864014e-05, 3.7416815757751465e-05, 5.0283968448638916e-05, 6.315112113952637e-05, 7.601827383041382e-05, 8.888542652130127e-05, 0.00010175257921218872, 0.00011461973190307617, 0.00012748688459396362, 0.00014035403728485107, 0.00015322118997573853, 0.00016608834266662598, 0.00017895549535751343, 0.00019182264804840088, 0.00020468980073928833, 0.00021755695343017578, 0.00023042410612106323, 0.00024329125881195068, 0.00025615841150283813, 0.0002690255641937256, 0.00028189271688461304, 0.0002947598695755005, 0.00030762702226638794, 0.0003204941749572754, 0.00033336132764816284, 0.0003462284803390503, 0.00035909563302993774, 0.0003719627857208252, 0.00038482993841171265, 0.0003976970911026001, 0.00041056424379348755, 0.000423431396484375]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 6.0, 6.0, 8.0, 10.0, 12.0, 7.0, 14.0, 20.0, 14.0, 22.0, 37.0, 43.0, 59.0, 81.0, 133.0, 232.0, 540.0, 3175.0, 1023569.0, 18884.0, 799.0, 293.0, 172.0, 100.0, 69.0, 36.0, 43.0, 35.0, 25.0, 22.0, 19.0, 18.0, 2.0, 7.0, 5.0, 12.0, 6.0, 7.0, 0.0, 3.0, 4.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00942230224609375, -0.00913381576538086, -0.008845329284667969, -0.008556842803955078, -0.008268356323242188, -0.007979869842529297, -0.007691383361816406, -0.007402896881103516, -0.007114410400390625, -0.006825923919677734, -0.006537437438964844, -0.006248950958251953, -0.0059604644775390625, -0.005671977996826172, -0.005383491516113281, -0.005095005035400391, -0.0048065185546875, -0.004518032073974609, -0.004229545593261719, -0.003941059112548828, -0.0036525726318359375, -0.003364086151123047, -0.0030755996704101562, -0.0027871131896972656, -0.002498626708984375, -0.0022101402282714844, -0.0019216537475585938, -0.0016331672668457031, -0.0013446807861328125, -0.0010561943054199219, -0.0007677078247070312, -0.0004792213439941406, -0.00019073486328125, 9.775161743164062e-05, 0.00038623809814453125, 0.0006747245788574219, 0.0009632110595703125, 0.0012516975402832031, 0.0015401840209960938, 0.0018286705017089844, 0.002117156982421875, 0.0024056434631347656, 0.0026941299438476562, 0.002982616424560547, 0.0032711029052734375, 0.003559589385986328, 0.0038480758666992188, 0.004136562347412109, 0.004425048828125, 0.004713535308837891, 0.005002021789550781, 0.005290508270263672, 0.0055789947509765625, 0.005867481231689453, 0.006155967712402344, 0.006444454193115234, 0.006732940673828125, 0.007021427154541016, 0.007309913635253906, 0.007598400115966797, 0.007886886596679688, 0.008175373077392578, 0.008463859558105469, 0.00875234603881836, 0.00904083251953125]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 262.0, 748.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0024615549482405186, -0.0023176034446805716, -0.0021736519411206245, -0.0020297004375606775, -0.0018857489340007305, -0.0017417974304407835, -0.0015978459268808365, -0.0014538944233208895, -0.0013099429197609425, -0.0011659914162009954, -0.0010220399126410484, -0.0008780884090811014, -0.0007341369055211544, -0.0005901854019612074, -0.0004462338984012604, -0.00030228239484131336, -0.00015833089128136635, -1.4379387721419334e-05, 0.00012957211583852768, 0.0002735236193984747, 0.0004174751229584217, 0.0005614266265183687, 0.0007053781300783157, 0.0008493296336382627, 0.0009932811371982098, 0.0011372326407581568, 0.0012811841443181038, 0.0014251356478780508, 0.0015690871514379978, 0.0017130386549979448, 0.0018569901585578918, 0.002000941662117839, 0.0021448927000164986, 0.0022888442035764456, 0.0024327957071363926, 0.0025767472106963396, 0.0027206987142562866, 0.0028646502178162336, 0.0030086017213761806, 0.0031525532249361277, 0.0032965047284960747, 0.0034404562320560217, 0.0035844077356159687, 0.0037283592391759157, 0.0038723107427358627, 0.004016262479126453, 0.004160213749855757, 0.00430416502058506, 0.004448116756975651, 0.0045920684933662415, 0.004736019764095545, 0.004879971034824848, 0.005023922771215439, 0.0051678745076060295, 0.005311825778335333, 0.005455777049064636, 0.005599728785455227, 0.0057436805218458176, 0.005887631792575121, 0.006031583063304424, 0.006175534799695015, 0.006319486536085606, 0.006463437806814909, 0.006607389077544212, 0.006751340813934803]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 10.0, 10.0, 21.0, 30.0, 40.0, 63.0, 69.0, 77.0, 107.0, 106.0, 94.0, 83.0, 85.0, 64.0, 61.0, 29.0, 22.0, 16.0, 11.0, 2.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00043714046478271484, -0.0004170164465904236, -0.0003968924283981323, -0.00037676841020584106, -0.0003566443920135498, -0.00033652037382125854, -0.0003163963556289673, -0.000296272337436676, -0.00027614831924438477, -0.0002560243010520935, -0.00023590028285980225, -0.00021577626466751099, -0.00019565224647521973, -0.00017552822828292847, -0.0001554042100906372, -0.00013528019189834595, -0.00011515617370605469, -9.503215551376343e-05, -7.490813732147217e-05, -5.478411912918091e-05, -3.466010093688965e-05, -1.4536082744598389e-05, 5.587935447692871e-06, 2.571195363998413e-05, 4.583597183227539e-05, 6.595999002456665e-05, 8.608400821685791e-05, 0.00010620802640914917, 0.00012633204460144043, 0.0001464560627937317, 0.00016658008098602295, 0.0001867040991783142, 0.00020682811737060547, 0.00022695213556289673, 0.000247076153755188, 0.00026720017194747925, 0.0002873241901397705, 0.00030744820833206177, 0.00032757222652435303, 0.0003476962447166443, 0.00036782026290893555, 0.0003879442811012268, 0.00040806829929351807, 0.0004281923174858093, 0.0004483163356781006, 0.00046844035387039185, 0.0004885643720626831, 0.0005086883902549744, 0.0005288124084472656, 0.0005489364266395569, 0.0005690604448318481, 0.0005891844630241394, 0.0006093084812164307, 0.0006294324994087219, 0.0006495565176010132, 0.0006696805357933044, 0.0006898045539855957, 0.000709928572177887, 0.0007300525903701782, 0.0007501766085624695, 0.0007703006267547607, 0.000790424644947052, 0.0008105486631393433, 0.0008306726813316345, 0.0008507966995239258]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 3.0, 5.0, 8.0, 9.0, 12.0, 17.0, 25.0, 16.0, 18.0, 25.0, 32.0, 33.0, 37.0, 30.0, 37.0, 31.0, 41.0, 44.0, 45.0, 48.0, 38.0, 33.0, 48.0, 44.0, 48.0, 37.0, 34.0, 25.0, 31.0, 37.0, 21.0, 19.0, 14.0, 11.0, 10.0, 10.0, 10.0, 3.0, 3.0, 7.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.921875, -16.368896484375, -15.81591796875, -15.262939453125, -14.7099609375, -14.156982421875, -13.60400390625, -13.051025390625, -12.498046875, -11.945068359375, -11.39208984375, -10.839111328125, -10.2861328125, -9.733154296875, -9.18017578125, -8.627197265625, -8.07421875, -7.521240234375, -6.96826171875, -6.415283203125, -5.8623046875, -5.309326171875, -4.75634765625, -4.203369140625, -3.650390625, -3.097412109375, -2.54443359375, -1.991455078125, -1.4384765625, -0.885498046875, -0.33251953125, 0.220458984375, 0.7734375, 1.326416015625, 1.87939453125, 2.432373046875, 2.9853515625, 3.538330078125, 4.09130859375, 4.644287109375, 5.197265625, 5.750244140625, 6.30322265625, 6.856201171875, 7.4091796875, 7.962158203125, 8.51513671875, 9.068115234375, 9.62109375, 10.174072265625, 10.72705078125, 11.280029296875, 11.8330078125, 12.385986328125, 12.93896484375, 13.491943359375, 14.044921875, 14.597900390625, 15.15087890625, 15.703857421875, 16.2568359375, 16.809814453125, 17.36279296875, 17.915771484375, 18.46875]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 11.0, 6.0, 13.0, 17.0, 20.0, 36.0, 53.0, 73.0, 110.0, 156.0, 238.0, 395.0, 572.0, 949.0, 1464.0, 2347.0, 3611.0, 5898.0, 9482.0, 16701.0, 31602.0, 72078.0, 239854.0, 445265.0, 118102.0, 45072.0, 22132.0, 12451.0, 7325.0, 4499.0, 2908.0, 1779.0, 1214.0, 682.0, 471.0, 324.0, 188.0, 156.0, 103.0, 64.0, 36.0, 32.0, 18.0, 16.0, 8.0, 7.0, 5.0, 3.0, 4.0, 5.0, 0.0, 1.0, 1.0, 1.0], "bins": [-20.59375, -19.97412109375, -19.3544921875, -18.73486328125, -18.115234375, -17.49560546875, -16.8759765625, -16.25634765625, -15.63671875, -15.01708984375, -14.3974609375, -13.77783203125, -13.158203125, -12.53857421875, -11.9189453125, -11.29931640625, -10.6796875, -10.06005859375, -9.4404296875, -8.82080078125, -8.201171875, -7.58154296875, -6.9619140625, -6.34228515625, -5.72265625, -5.10302734375, -4.4833984375, -3.86376953125, -3.244140625, -2.62451171875, -2.0048828125, -1.38525390625, -0.765625, -0.14599609375, 0.4736328125, 1.09326171875, 1.712890625, 2.33251953125, 2.9521484375, 3.57177734375, 4.19140625, 4.81103515625, 5.4306640625, 6.05029296875, 6.669921875, 7.28955078125, 7.9091796875, 8.52880859375, 9.1484375, 9.76806640625, 10.3876953125, 11.00732421875, 11.626953125, 12.24658203125, 12.8662109375, 13.48583984375, 14.10546875, 14.72509765625, 15.3447265625, 15.96435546875, 16.583984375, 17.20361328125, 17.8232421875, 18.44287109375, 19.0625]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 5.0, 2.0, 3.0, 11.0, 5.0, 3.0, 8.0, 16.0, 26.0, 28.0, 17.0, 35.0, 27.0, 44.0, 30.0, 30.0, 55.0, 76.0, 108.0, 205.0, 1585.0, 207.0, 92.0, 68.0, 56.0, 51.0, 40.0, 33.0, 37.0, 20.0, 27.0, 24.0, 21.0, 19.0, 7.0, 9.0, 8.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-48.59375, -47.14599609375, -45.6982421875, -44.25048828125, -42.802734375, -41.35498046875, -39.9072265625, -38.45947265625, -37.01171875, -35.56396484375, -34.1162109375, -32.66845703125, -31.220703125, -29.77294921875, -28.3251953125, -26.87744140625, -25.4296875, -23.98193359375, -22.5341796875, -21.08642578125, -19.638671875, -18.19091796875, -16.7431640625, -15.29541015625, -13.84765625, -12.39990234375, -10.9521484375, -9.50439453125, -8.056640625, -6.60888671875, -5.1611328125, -3.71337890625, -2.265625, -0.81787109375, 0.6298828125, 2.07763671875, 3.525390625, 4.97314453125, 6.4208984375, 7.86865234375, 9.31640625, 10.76416015625, 12.2119140625, 13.65966796875, 15.107421875, 16.55517578125, 18.0029296875, 19.45068359375, 20.8984375, 22.34619140625, 23.7939453125, 25.24169921875, 26.689453125, 28.13720703125, 29.5849609375, 31.03271484375, 32.48046875, 33.92822265625, 35.3759765625, 36.82373046875, 38.271484375, 39.71923828125, 41.1669921875, 42.61474609375, 44.0625]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 6.0, 4.0, 7.0, 13.0, 3.0, 7.0, 16.0, 26.0, 31.0, 28.0, 40.0, 64.0, 92.0, 133.0, 219.0, 364.0, 941.0, 2336.0, 7172.0, 24958.0, 150872.0, 2749073.0, 170117.0, 26890.0, 7786.0, 2452.0, 953.0, 362.0, 246.0, 119.0, 108.0, 54.0, 36.0, 41.0, 33.0, 15.0, 16.0, 19.0, 13.0, 5.0, 7.0, 5.0, 6.0, 7.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-52.34375, -50.734375, -49.125, -47.515625, -45.90625, -44.296875, -42.6875, -41.078125, -39.46875, -37.859375, -36.25, -34.640625, -33.03125, -31.421875, -29.8125, -28.203125, -26.59375, -24.984375, -23.375, -21.765625, -20.15625, -18.546875, -16.9375, -15.328125, -13.71875, -12.109375, -10.5, -8.890625, -7.28125, -5.671875, -4.0625, -2.453125, -0.84375, 0.765625, 2.375, 3.984375, 5.59375, 7.203125, 8.8125, 10.421875, 12.03125, 13.640625, 15.25, 16.859375, 18.46875, 20.078125, 21.6875, 23.296875, 24.90625, 26.515625, 28.125, 29.734375, 31.34375, 32.953125, 34.5625, 36.171875, 37.78125, 39.390625, 41.0, 42.609375, 44.21875, 45.828125, 47.4375, 49.046875, 50.65625]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 47.0, 390.0, 494.0, 71.0, 10.0, 1.0, 1.0, 1.0], "bins": [-779.1015625, -765.6905517578125, -752.279541015625, -738.8685302734375, -725.4574584960938, -712.0464477539062, -698.6354370117188, -685.2244262695312, -671.8134155273438, -658.4024047851562, -644.9913940429688, -631.580322265625, -618.1693115234375, -604.75830078125, -591.3472900390625, -577.936279296875, -564.5252685546875, -551.1142578125, -537.7032470703125, -524.292236328125, -510.8811950683594, -497.47015380859375, -484.05914306640625, -470.64813232421875, -457.237060546875, -443.8260498046875, -430.4150085449219, -417.0039978027344, -403.5929870605469, -390.18194580078125, -376.77093505859375, -363.35992431640625, -349.9489440917969, -336.5379333496094, -323.12689208984375, -309.71588134765625, -296.30487060546875, -282.89385986328125, -269.4828186035156, -256.0718078613281, -242.66078186035156, -229.249755859375, -215.8387451171875, -202.42771911621094, -189.01669311523438, -175.60568237304688, -162.1946563720703, -148.78363037109375, -135.37261962890625, -121.96160125732422, -108.55058288574219, -95.13955688476562, -81.7285385131836, -68.31752014160156, -54.906494140625, -41.49547576904297, -28.084457397460938, -14.673437118530273, -1.2624168395996094, 12.148605346679688, 25.55962371826172, 38.97064208984375, 52.38166809082031, 65.79268646240234, 79.20370483398438]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 5.0, 1.0, 6.0, 5.0, 4.0, 8.0, 6.0, 8.0, 16.0, 12.0, 11.0, 19.0, 19.0, 17.0, 16.0, 24.0, 24.0, 27.0, 29.0, 34.0, 26.0, 36.0, 40.0, 25.0, 37.0, 45.0, 37.0, 34.0, 38.0, 43.0, 41.0, 41.0, 33.0, 22.0, 34.0, 21.0, 15.0, 22.0, 23.0, 18.0, 19.0, 8.0, 9.0, 11.0, 10.0, 6.0, 6.0, 7.0, 3.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-85.95767211914062, -83.10855102539062, -80.25942993164062, -77.41031646728516, -74.56119537353516, -71.71207427978516, -68.86296081542969, -66.01383972167969, -63.16471862792969, -60.31559753417969, -57.46648025512695, -54.61736297607422, -51.76824188232422, -48.91912078857422, -46.070003509521484, -43.22088623046875, -40.37176513671875, -37.52264404296875, -34.673526763916016, -31.82440757751465, -28.97528839111328, -26.126169204711914, -23.277050018310547, -20.42793083190918, -17.578811645507812, -14.729692459106445, -11.880573272705078, -9.031454086303711, -6.182334899902344, -3.3332157135009766, -0.4840965270996094, 2.365022659301758, 5.214134216308594, 8.063253402709961, 10.912372589111328, 13.761491775512695, 16.610610961914062, 19.45973014831543, 22.308849334716797, 25.157968521118164, 28.00708770751953, 30.8562068939209, 33.705326080322266, 36.554443359375, 39.403564453125, 42.252685546875, 45.101802825927734, 47.95092010498047, 50.80004119873047, 53.64916229248047, 56.4982795715332, 59.34739685058594, 62.19651794433594, 65.04563903808594, 67.89476013183594, 70.7438735961914, 73.5929946899414, 76.4421157836914, 79.29122924804688, 82.14035034179688, 84.98947143554688, 87.83859252929688, 90.68771362304688, 93.53682708740234, 96.38594818115234]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 8.0, 3.0, 11.0, 10.0, 18.0, 22.0, 23.0, 24.0, 28.0, 33.0, 38.0, 29.0, 40.0, 35.0, 41.0, 42.0, 42.0, 49.0, 39.0, 48.0, 39.0, 62.0, 46.0, 40.0, 33.0, 18.0, 32.0, 26.0, 24.0, 27.0, 18.0, 14.0, 11.0, 5.0, 8.0, 7.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.453125, -19.849853515625, -19.24658203125, -18.643310546875, -18.0400390625, -17.436767578125, -16.83349609375, -16.230224609375, -15.626953125, -15.023681640625, -14.42041015625, -13.817138671875, -13.2138671875, -12.610595703125, -12.00732421875, -11.404052734375, -10.80078125, -10.197509765625, -9.59423828125, -8.990966796875, -8.3876953125, -7.784423828125, -7.18115234375, -6.577880859375, -5.974609375, -5.371337890625, -4.76806640625, -4.164794921875, -3.5615234375, -2.958251953125, -2.35498046875, -1.751708984375, -1.1484375, -0.545166015625, 0.05810546875, 0.661376953125, 1.2646484375, 1.867919921875, 2.47119140625, 3.074462890625, 3.677734375, 4.281005859375, 4.88427734375, 5.487548828125, 6.0908203125, 6.694091796875, 7.29736328125, 7.900634765625, 8.50390625, 9.107177734375, 9.71044921875, 10.313720703125, 10.9169921875, 11.520263671875, 12.12353515625, 12.726806640625, 13.330078125, 13.933349609375, 14.53662109375, 15.139892578125, 15.7431640625, 16.346435546875, 16.94970703125, 17.552978515625, 18.15625]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 3.0, 2.0, 4.0, 1.0, 4.0, 6.0, 11.0, 10.0, 10.0, 18.0, 14.0, 22.0, 28.0, 30.0, 35.0, 48.0, 58.0, 75.0, 85.0, 116.0, 183.0, 283.0, 652.0, 2020.0, 13444.0, 2764806.0, 1397797.0, 11174.0, 1758.0, 542.0, 298.0, 171.0, 133.0, 85.0, 64.0, 56.0, 47.0, 33.0, 24.0, 18.0, 19.0, 20.0, 16.0, 15.0, 14.0, 8.0, 6.0, 6.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-128.875, -124.96484375, -121.0546875, -117.14453125, -113.234375, -109.32421875, -105.4140625, -101.50390625, -97.59375, -93.68359375, -89.7734375, -85.86328125, -81.953125, -78.04296875, -74.1328125, -70.22265625, -66.3125, -62.40234375, -58.4921875, -54.58203125, -50.671875, -46.76171875, -42.8515625, -38.94140625, -35.03125, -31.12109375, -27.2109375, -23.30078125, -19.390625, -15.48046875, -11.5703125, -7.66015625, -3.75, 0.16015625, 4.0703125, 7.98046875, 11.890625, 15.80078125, 19.7109375, 23.62109375, 27.53125, 31.44140625, 35.3515625, 39.26171875, 43.171875, 47.08203125, 50.9921875, 54.90234375, 58.8125, 62.72265625, 66.6328125, 70.54296875, 74.453125, 78.36328125, 82.2734375, 86.18359375, 90.09375, 94.00390625, 97.9140625, 101.82421875, 105.734375, 109.64453125, 113.5546875, 117.46484375, 121.375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 2.0, 5.0, 3.0, 7.0, 4.0, 5.0, 8.0, 5.0, 8.0, 12.0, 16.0, 15.0, 22.0, 20.0, 20.0, 38.0, 31.0, 50.0, 93.0, 133.0, 221.0, 306.0, 554.0, 756.0, 642.0, 361.0, 231.0, 128.0, 84.0, 65.0, 54.0, 35.0, 29.0, 27.0, 20.0, 14.0, 9.0, 9.0, 7.0, 6.0, 6.0, 4.0, 6.0, 3.0, 5.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-24.640625, -23.908935546875, -23.17724609375, -22.445556640625, -21.7138671875, -20.982177734375, -20.25048828125, -19.518798828125, -18.787109375, -18.055419921875, -17.32373046875, -16.592041015625, -15.8603515625, -15.128662109375, -14.39697265625, -13.665283203125, -12.93359375, -12.201904296875, -11.47021484375, -10.738525390625, -10.0068359375, -9.275146484375, -8.54345703125, -7.811767578125, -7.080078125, -6.348388671875, -5.61669921875, -4.885009765625, -4.1533203125, -3.421630859375, -2.68994140625, -1.958251953125, -1.2265625, -0.494873046875, 0.23681640625, 0.968505859375, 1.7001953125, 2.431884765625, 3.16357421875, 3.895263671875, 4.626953125, 5.358642578125, 6.09033203125, 6.822021484375, 7.5537109375, 8.285400390625, 9.01708984375, 9.748779296875, 10.48046875, 11.212158203125, 11.94384765625, 12.675537109375, 13.4072265625, 14.138916015625, 14.87060546875, 15.602294921875, 16.333984375, 17.065673828125, 17.79736328125, 18.529052734375, 19.2607421875, 19.992431640625, 20.72412109375, 21.455810546875, 22.1875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 5.0, 11.0, 20.0, 24.0, 27.0, 31.0, 59.0, 86.0, 129.0, 224.0, 614.0, 1987.0, 7831.0, 43538.0, 983151.0, 3077974.0, 64004.0, 10664.0, 2467.0, 710.0, 309.0, 118.0, 89.0, 52.0, 37.0, 45.0, 19.0, 15.0, 11.0, 6.0, 5.0, 3.0, 3.0, 3.0, 5.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-73.1875, -70.833984375, -68.48046875, -66.126953125, -63.7734375, -61.419921875, -59.06640625, -56.712890625, -54.359375, -52.005859375, -49.65234375, -47.298828125, -44.9453125, -42.591796875, -40.23828125, -37.884765625, -35.53125, -33.177734375, -30.82421875, -28.470703125, -26.1171875, -23.763671875, -21.41015625, -19.056640625, -16.703125, -14.349609375, -11.99609375, -9.642578125, -7.2890625, -4.935546875, -2.58203125, -0.228515625, 2.125, 4.478515625, 6.83203125, 9.185546875, 11.5390625, 13.892578125, 16.24609375, 18.599609375, 20.953125, 23.306640625, 25.66015625, 28.013671875, 30.3671875, 32.720703125, 35.07421875, 37.427734375, 39.78125, 42.134765625, 44.48828125, 46.841796875, 49.1953125, 51.548828125, 53.90234375, 56.255859375, 58.609375, 60.962890625, 63.31640625, 65.669921875, 68.0234375, 70.376953125, 72.73046875, 75.083984375, 77.4375]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 3.0, 30.0, 318.0, 575.0, 81.0, 12.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.22539520263672, -56.66133117675781, -39.09726333618164, -21.53319549560547, -3.9691314697265625, 13.594932556152344, 31.15900421142578, 48.72306823730469, 66.2871322631836, 83.8511962890625, 101.41526794433594, 118.97933197021484, 136.54339599609375, 154.10745239257812, 171.67153930664062, 189.235595703125, 206.79965209960938, 224.3637237548828, 241.9277801513672, 259.4918518066406, 277.055908203125, 294.6199951171875, 312.1840515136719, 329.74810791015625, 347.31219482421875, 364.8762512207031, 382.4403381347656, 400.00439453125, 417.5684509277344, 435.13250732421875, 452.69659423828125, 470.2606506347656, 487.82476806640625, 505.3888244628906, 522.952880859375, 540.5169677734375, 558.0810546875, 575.6450805664062, 593.2091674804688, 610.7732543945312, 628.3372802734375, 645.9013671875, 663.4653930664062, 681.0294799804688, 698.5935668945312, 716.1575927734375, 733.7216796875, 751.2857666015625, 768.849853515625, 786.4139404296875, 803.9779663085938, 821.5420532226562, 839.1061401367188, 856.670166015625, 874.2342529296875, 891.79833984375, 909.3623657226562, 926.9264526367188, 944.490478515625, 962.0545654296875, 979.61865234375, 997.1826782226562, 1014.7467651367188, 1032.310791015625, 1049.8748779296875]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 1.0, 4.0, 5.0, 3.0, 3.0, 7.0, 12.0, 12.0, 18.0, 23.0, 19.0, 24.0, 28.0, 19.0, 31.0, 34.0, 46.0, 27.0, 42.0, 44.0, 35.0, 45.0, 51.0, 31.0, 45.0, 46.0, 36.0, 41.0, 44.0, 34.0, 30.0, 26.0, 20.0, 25.0, 28.0, 19.0, 10.0, 11.0, 6.0, 7.0, 2.0, 4.0, 3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-89.94453430175781, -87.46626281738281, -84.98799133300781, -82.50971221923828, -80.03144073486328, -77.55316925048828, -75.07489776611328, -72.59661865234375, -70.11834716796875, -67.64007568359375, -65.16180419921875, -62.683528900146484, -60.20525360107422, -57.72698211669922, -55.24871063232422, -52.77043533325195, -50.29216384887695, -47.81389236450195, -45.33561706542969, -42.85734558105469, -40.37907028198242, -37.90079879760742, -35.422523498535156, -32.944252014160156, -30.465978622436523, -27.98770523071289, -25.509431838989258, -23.031158447265625, -20.552886962890625, -18.07461166381836, -15.59634017944336, -13.118066787719727, -10.639793395996094, -8.161520004272461, -5.683247089385986, -3.2049741744995117, -0.7267007827758789, 1.751572608947754, 4.22984504699707, 6.708118438720703, 9.186391830444336, 11.664665222167969, 14.142938613891602, 16.621212005615234, 19.099483489990234, 21.5777587890625, 24.0560302734375, 26.534303665161133, 29.012577056884766, 31.4908504486084, 33.96912384033203, 36.44739532470703, 38.9256706237793, 41.4039421081543, 43.88221740722656, 46.36048889160156, 48.83876037597656, 51.31703186035156, 53.79530715942383, 56.27357864379883, 58.751853942871094, 61.230125427246094, 63.708396911621094, 66.18667602539062, 68.66494750976562]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 10.0, 15.0, 14.0, 11.0, 20.0, 16.0, 26.0, 37.0, 29.0, 25.0, 32.0, 41.0, 46.0, 48.0, 44.0, 48.0, 45.0, 46.0, 55.0, 44.0, 53.0, 37.0, 45.0, 33.0, 22.0, 32.0, 30.0, 26.0, 16.0, 13.0, 12.0, 9.0, 7.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.5, -18.897705078125, -18.29541015625, -17.693115234375, -17.0908203125, -16.488525390625, -15.88623046875, -15.283935546875, -14.681640625, -14.079345703125, -13.47705078125, -12.874755859375, -12.2724609375, -11.670166015625, -11.06787109375, -10.465576171875, -9.86328125, -9.260986328125, -8.65869140625, -8.056396484375, -7.4541015625, -6.851806640625, -6.24951171875, -5.647216796875, -5.044921875, -4.442626953125, -3.84033203125, -3.238037109375, -2.6357421875, -2.033447265625, -1.43115234375, -0.828857421875, -0.2265625, 0.375732421875, 0.97802734375, 1.580322265625, 2.1826171875, 2.784912109375, 3.38720703125, 3.989501953125, 4.591796875, 5.194091796875, 5.79638671875, 6.398681640625, 7.0009765625, 7.603271484375, 8.20556640625, 8.807861328125, 9.41015625, 10.012451171875, 10.61474609375, 11.217041015625, 11.8193359375, 12.421630859375, 13.02392578125, 13.626220703125, 14.228515625, 14.830810546875, 15.43310546875, 16.035400390625, 16.6376953125, 17.239990234375, 17.84228515625, 18.444580078125, 19.046875]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 3.0, 7.0, 8.0, 23.0, 22.0, 46.0, 67.0, 81.0, 127.0, 194.0, 319.0, 484.0, 747.0, 1242.0, 2112.0, 3394.0, 5707.0, 9716.0, 17037.0, 30133.0, 53334.0, 95703.0, 174369.0, 263436.0, 172646.0, 94221.0, 52546.0, 29770.0, 17031.0, 9626.0, 5690.0, 3331.0, 2030.0, 1271.0, 722.0, 484.0, 306.0, 198.0, 138.0, 82.0, 50.0, 29.0, 28.0, 12.0, 17.0, 8.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.384033203125, -0.3718376159667969, -0.35964202880859375, -0.3474464416503906, -0.3352508544921875, -0.3230552673339844, -0.31085968017578125, -0.2986640930175781, -0.286468505859375, -0.2742729187011719, -0.26207733154296875, -0.24988174438476562, -0.2376861572265625, -0.22549057006835938, -0.21329498291015625, -0.20109939575195312, -0.18890380859375, -0.17670822143554688, -0.16451263427734375, -0.15231704711914062, -0.1401214599609375, -0.12792587280273438, -0.11573028564453125, -0.10353469848632812, -0.091339111328125, -0.07914352416992188, -0.06694793701171875, -0.054752349853515625, -0.0425567626953125, -0.030361175537109375, -0.01816558837890625, -0.005970001220703125, 0.0062255859375, 0.018421173095703125, 0.03061676025390625, 0.042812347412109375, 0.0550079345703125, 0.06720352172851562, 0.07939910888671875, 0.09159469604492188, 0.103790283203125, 0.11598587036132812, 0.12818145751953125, 0.14037704467773438, 0.1525726318359375, 0.16476821899414062, 0.17696380615234375, 0.18915939331054688, 0.20135498046875, 0.21355056762695312, 0.22574615478515625, 0.23794174194335938, 0.2501373291015625, 0.2623329162597656, 0.27452850341796875, 0.2867240905761719, 0.298919677734375, 0.3111152648925781, 0.32331085205078125, 0.3355064392089844, 0.3477020263671875, 0.3598976135253906, 0.37209320068359375, 0.3842887878417969, 0.396484375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 5.0, 6.0, 3.0, 5.0, 8.0, 15.0, 10.0, 16.0, 17.0, 17.0, 28.0, 28.0, 28.0, 28.0, 33.0, 28.0, 44.0, 31.0, 35.0, 41.0, 41.0, 1058.0, 36.0, 51.0, 48.0, 38.0, 29.0, 32.0, 24.0, 34.0, 29.0, 25.0, 33.0, 16.0, 16.0, 20.0, 8.0, 12.0, 12.0, 10.0, 4.0, 5.0, 7.0, 7.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.359375, -10.01171875, -9.6640625, -9.31640625, -8.96875, -8.62109375, -8.2734375, -7.92578125, -7.578125, -7.23046875, -6.8828125, -6.53515625, -6.1875, -5.83984375, -5.4921875, -5.14453125, -4.796875, -4.44921875, -4.1015625, -3.75390625, -3.40625, -3.05859375, -2.7109375, -2.36328125, -2.015625, -1.66796875, -1.3203125, -0.97265625, -0.625, -0.27734375, 0.0703125, 0.41796875, 0.765625, 1.11328125, 1.4609375, 1.80859375, 2.15625, 2.50390625, 2.8515625, 3.19921875, 3.546875, 3.89453125, 4.2421875, 4.58984375, 4.9375, 5.28515625, 5.6328125, 5.98046875, 6.328125, 6.67578125, 7.0234375, 7.37109375, 7.71875, 8.06640625, 8.4140625, 8.76171875, 9.109375, 9.45703125, 9.8046875, 10.15234375, 10.5, 10.84765625, 11.1953125, 11.54296875, 11.890625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 8.0, 12.0, 14.0, 35.0, 50.0, 91.0, 138.0, 204.0, 400.0, 595.0, 882.0, 1357.0, 2019.0, 3322.0, 5350.0, 8697.0, 14370.0, 23701.0, 39814.0, 67846.0, 120329.0, 233289.0, 1275200.0, 125342.0, 70060.0, 41203.0, 24498.0, 14439.0, 8934.0, 5454.0, 3475.0, 2125.0, 1397.0, 920.0, 613.0, 372.0, 235.0, 139.0, 84.0, 45.0, 18.0, 13.0, 11.0, 12.0, 4.0, 5.0, 4.0, 8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2047119140625, -0.19811439514160156, -0.19151687622070312, -0.1849193572998047, -0.17832183837890625, -0.1717243194580078, -0.16512680053710938, -0.15852928161621094, -0.1519317626953125, -0.14533424377441406, -0.13873672485351562, -0.1321392059326172, -0.12554168701171875, -0.11894416809082031, -0.11234664916992188, -0.10574913024902344, -0.099151611328125, -0.09255409240722656, -0.08595657348632812, -0.07935905456542969, -0.07276153564453125, -0.06616401672363281, -0.059566497802734375, -0.05296897888183594, -0.0463714599609375, -0.03977394104003906, -0.033176422119140625, -0.026578903198242188, -0.01998138427734375, -0.013383865356445312, -0.006786346435546875, -0.0001888275146484375, 0.00640869140625, 0.013006210327148438, 0.019603729248046875, 0.026201248168945312, 0.03279876708984375, 0.03939628601074219, 0.045993804931640625, 0.05259132385253906, 0.0591888427734375, 0.06578636169433594, 0.07238388061523438, 0.07898139953613281, 0.08557891845703125, 0.09217643737792969, 0.09877395629882812, 0.10537147521972656, 0.111968994140625, 0.11856651306152344, 0.12516403198242188, 0.1317615509033203, 0.13835906982421875, 0.1449565887451172, 0.15155410766601562, 0.15815162658691406, 0.1647491455078125, 0.17134666442871094, 0.17794418334960938, 0.1845417022705078, 0.19113922119140625, 0.1977367401123047, 0.20433425903320312, 0.21093177795410156, 0.217529296875]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 4.0, 3.0, 7.0, 4.0, 6.0, 14.0, 16.0, 18.0, 36.0, 50.0, 54.0, 82.0, 141.0, 147.0, 107.0, 81.0, 59.0, 45.0, 28.0, 19.0, 20.0, 13.0, 7.0, 7.0, 8.0, 3.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003809928894042969, -0.0003670230507850647, -0.0003530532121658325, -0.00033908337354660034, -0.00032511353492736816, -0.000311143696308136, -0.0002971738576889038, -0.00028320401906967163, -0.00026923418045043945, -0.0002552643418312073, -0.0002412945032119751, -0.00022732466459274292, -0.00021335482597351074, -0.00019938498735427856, -0.0001854151487350464, -0.0001714453101158142, -0.00015747547149658203, -0.00014350563287734985, -0.00012953579425811768, -0.0001155659556388855, -0.00010159611701965332, -8.762627840042114e-05, -7.365643978118896e-05, -5.968660116195679e-05, -4.571676254272461e-05, -3.174692392349243e-05, -1.7777085304260254e-05, -3.807246685028076e-06, 1.0162591934204102e-05, 2.413243055343628e-05, 3.810226917266846e-05, 5.2072107791900635e-05, 6.604194641113281e-05, 8.001178503036499e-05, 9.398162364959717e-05, 0.00010795146226882935, 0.00012192130088806152, 0.0001358911395072937, 0.00014986097812652588, 0.00016383081674575806, 0.00017780065536499023, 0.0001917704939842224, 0.0002057403326034546, 0.00021971017122268677, 0.00023368000984191895, 0.0002476498484611511, 0.0002616196870803833, 0.0002755895256996155, 0.00028955936431884766, 0.00030352920293807983, 0.000317499041557312, 0.0003314688801765442, 0.00034543871879577637, 0.00035940855741500854, 0.0003733783960342407, 0.0003873482346534729, 0.0004013180732727051, 0.00041528791189193726, 0.00042925775051116943, 0.0004432275891304016, 0.0004571974277496338, 0.00047116726636886597, 0.00048513710498809814, 0.0004991069436073303, 0.0005130767822265625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 3.0, 6.0, 5.0, 5.0, 9.0, 7.0, 11.0, 20.0, 33.0, 38.0, 57.0, 94.0, 166.0, 358.0, 1598.0, 1023800.0, 21245.0, 555.0, 227.0, 108.0, 71.0, 38.0, 19.0, 24.0, 12.0, 8.0, 11.0, 5.0, 4.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0111846923828125, -0.010880231857299805, -0.01057577133178711, -0.010271310806274414, -0.009966850280761719, -0.009662389755249023, -0.009357929229736328, -0.009053468704223633, -0.008749008178710938, -0.008444547653198242, -0.008140087127685547, -0.007835626602172852, -0.007531166076660156, -0.007226705551147461, -0.006922245025634766, -0.00661778450012207, -0.006313323974609375, -0.00600886344909668, -0.005704402923583984, -0.005399942398071289, -0.005095481872558594, -0.0047910213470458984, -0.004486560821533203, -0.004182100296020508, -0.0038776397705078125, -0.003573179244995117, -0.003268718719482422, -0.0029642581939697266, -0.0026597976684570312, -0.002355337142944336, -0.0020508766174316406, -0.0017464160919189453, -0.00144195556640625, -0.0011374950408935547, -0.0008330345153808594, -0.0005285739898681641, -0.00022411346435546875, 8.034706115722656e-05, 0.0003848075866699219, 0.0006892681121826172, 0.0009937286376953125, 0.0012981891632080078, 0.0016026496887207031, 0.0019071102142333984, 0.0022115707397460938, 0.002516031265258789, 0.0028204917907714844, 0.0031249523162841797, 0.003429412841796875, 0.0037338733673095703, 0.004038333892822266, 0.004342794418334961, 0.004647254943847656, 0.0049517154693603516, 0.005256175994873047, 0.005560636520385742, 0.0058650970458984375, 0.006169557571411133, 0.006474018096923828, 0.0067784786224365234, 0.007082939147949219, 0.007387399673461914, 0.007691860198974609, 0.007996320724487305, 0.00830078125]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 17.0, 251.0, 689.0, 45.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0012884201714769006, -0.001239330624230206, -0.0011902411933988333, -0.0011411516461521387, -0.0010920620989054441, -0.0010429726680740714, -0.0009938831208273768, -0.0009447936317883432, -0.0008957041427493095, -0.0008466146537102759, -0.0007975251646712422, -0.0007484356174245477, -0.000699346128385514, -0.0006502566393464804, -0.0006011670920997858, -0.0005520776030607522, -0.0005029881140217185, -0.00045389862498268485, -0.00040480910683982074, -0.00035571958869695663, -0.000306630099657923, -0.00025754061061888933, -0.00020845109247602522, -0.00015936157433316112, -0.00011027208529412746, -6.118258170317858e-05, -1.2093078112229705e-05, 3.6996425478719175e-05, 8.608592906966805e-05, 0.0001351754181087017, 0.00018426493625156581, 0.00023335445439442992, 0.0002824440598487854, 0.00033153354888781905, 0.00038062306703068316, 0.00042971258517354727, 0.0004788020742125809, 0.0005278915632516146, 0.0005769811104983091, 0.0006260705995373428, 0.0006751600885763764, 0.0007242495776154101, 0.0007733390666544437, 0.0008224286139011383, 0.000871518102940172, 0.0009206075919792056, 0.0009696971392259002, 0.001018786570057273, 0.0010678761173039675, 0.001116965664550662, 0.0011660550953820348, 0.0012151446426287293, 0.001264234073460102, 0.0013133236207067966, 0.0013624131679534912, 0.0014115027152001858, 0.0014605921460315585, 0.001509681693278253, 0.0015587711241096258, 0.0016078606713563204, 0.001656950218603015, 0.0017060396494343877, 0.0017551291966810822, 0.001804218627512455, 0.0018533081747591496]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 10.0, 10.0, 15.0, 27.0, 39.0, 52.0, 62.0, 63.0, 61.0, 92.0, 79.0, 67.0, 89.0, 69.0, 62.0, 53.0, 46.0, 37.0, 28.0, 16.0, 12.0, 7.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00040787458419799805, -0.000395849347114563, -0.00038382411003112793, -0.00037179887294769287, -0.0003597736358642578, -0.00034774839878082275, -0.0003357231616973877, -0.00032369792461395264, -0.0003116726875305176, -0.0002996474504470825, -0.00028762221336364746, -0.0002755969762802124, -0.00026357173919677734, -0.0002515465021133423, -0.00023952126502990723, -0.00022749602794647217, -0.0002154707908630371, -0.00020344555377960205, -0.000191420316696167, -0.00017939507961273193, -0.00016736984252929688, -0.00015534460544586182, -0.00014331936836242676, -0.0001312941312789917, -0.00011926889419555664, -0.00010724365711212158, -9.521842002868652e-05, -8.319318294525146e-05, -7.11679458618164e-05, -5.914270877838135e-05, -4.711747169494629e-05, -3.509223461151123e-05, -2.3066997528076172e-05, -1.1041760444641113e-05, 9.834766387939453e-07, 1.3008713722229004e-05, 2.5033950805664062e-05, 3.705918788909912e-05, 4.908442497253418e-05, 6.110966205596924e-05, 7.31348991394043e-05, 8.516013622283936e-05, 9.718537330627441e-05, 0.00010921061038970947, 0.00012123584747314453, 0.0001332610845565796, 0.00014528632164001465, 0.0001573115587234497, 0.00016933679580688477, 0.00018136203289031982, 0.00019338726997375488, 0.00020541250705718994, 0.000217437744140625, 0.00022946298122406006, 0.00024148821830749512, 0.0002535134553909302, 0.00026553869247436523, 0.0002775639295578003, 0.00028958916664123535, 0.0003016144037246704, 0.00031363964080810547, 0.00032566487789154053, 0.0003376901149749756, 0.00034971535205841064, 0.0003617405891418457]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 10.0, 15.0, 14.0, 11.0, 20.0, 16.0, 26.0, 37.0, 29.0, 25.0, 32.0, 41.0, 46.0, 48.0, 44.0, 48.0, 45.0, 46.0, 55.0, 44.0, 53.0, 37.0, 45.0, 33.0, 22.0, 32.0, 30.0, 26.0, 16.0, 13.0, 12.0, 9.0, 7.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.5, -18.897705078125, -18.29541015625, -17.693115234375, -17.0908203125, -16.488525390625, -15.88623046875, -15.283935546875, -14.681640625, -14.079345703125, -13.47705078125, -12.874755859375, -12.2724609375, -11.670166015625, -11.06787109375, -10.465576171875, -9.86328125, -9.260986328125, -8.65869140625, -8.056396484375, -7.4541015625, -6.851806640625, -6.24951171875, -5.647216796875, -5.044921875, -4.442626953125, -3.84033203125, -3.238037109375, -2.6357421875, -2.033447265625, -1.43115234375, -0.828857421875, -0.2265625, 0.375732421875, 0.97802734375, 1.580322265625, 2.1826171875, 2.784912109375, 3.38720703125, 3.989501953125, 4.591796875, 5.194091796875, 5.79638671875, 6.398681640625, 7.0009765625, 7.603271484375, 8.20556640625, 8.807861328125, 9.41015625, 10.012451171875, 10.61474609375, 11.217041015625, 11.8193359375, 12.421630859375, 13.02392578125, 13.626220703125, 14.228515625, 14.830810546875, 15.43310546875, 16.035400390625, 16.6376953125, 17.239990234375, 17.84228515625, 18.444580078125, 19.046875]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 6.0, 1.0, 8.0, 4.0, 8.0, 10.0, 20.0, 25.0, 40.0, 44.0, 70.0, 107.0, 157.0, 263.0, 368.0, 580.0, 847.0, 1306.0, 2170.0, 3275.0, 5781.0, 10134.0, 19279.0, 41619.0, 104142.0, 313633.0, 339631.0, 113461.0, 44762.0, 20934.0, 10408.0, 5877.0, 3441.0, 2190.0, 1381.0, 833.0, 566.0, 372.0, 253.0, 177.0, 132.0, 72.0, 50.0, 51.0, 19.0, 19.0, 10.0, 12.0, 9.0, 8.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.390625, -20.654052734375, -19.91748046875, -19.180908203125, -18.4443359375, -17.707763671875, -16.97119140625, -16.234619140625, -15.498046875, -14.761474609375, -14.02490234375, -13.288330078125, -12.5517578125, -11.815185546875, -11.07861328125, -10.342041015625, -9.60546875, -8.868896484375, -8.13232421875, -7.395751953125, -6.6591796875, -5.922607421875, -5.18603515625, -4.449462890625, -3.712890625, -2.976318359375, -2.23974609375, -1.503173828125, -0.7666015625, -0.030029296875, 0.70654296875, 1.443115234375, 2.1796875, 2.916259765625, 3.65283203125, 4.389404296875, 5.1259765625, 5.862548828125, 6.59912109375, 7.335693359375, 8.072265625, 8.808837890625, 9.54541015625, 10.281982421875, 11.0185546875, 11.755126953125, 12.49169921875, 13.228271484375, 13.96484375, 14.701416015625, 15.43798828125, 16.174560546875, 16.9111328125, 17.647705078125, 18.38427734375, 19.120849609375, 19.857421875, 20.593994140625, 21.33056640625, 22.067138671875, 22.8037109375, 23.540283203125, 24.27685546875, 25.013427734375, 25.75]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 6.0, 4.0, 4.0, 7.0, 10.0, 13.0, 16.0, 25.0, 21.0, 26.0, 38.0, 37.0, 40.0, 54.0, 55.0, 89.0, 138.0, 1510.0, 390.0, 140.0, 72.0, 71.0, 47.0, 46.0, 37.0, 26.0, 29.0, 21.0, 18.0, 14.0, 14.0, 9.0, 4.0, 3.0, 7.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.8125, -47.37158203125, -45.9306640625, -44.48974609375, -43.048828125, -41.60791015625, -40.1669921875, -38.72607421875, -37.28515625, -35.84423828125, -34.4033203125, -32.96240234375, -31.521484375, -30.08056640625, -28.6396484375, -27.19873046875, -25.7578125, -24.31689453125, -22.8759765625, -21.43505859375, -19.994140625, -18.55322265625, -17.1123046875, -15.67138671875, -14.23046875, -12.78955078125, -11.3486328125, -9.90771484375, -8.466796875, -7.02587890625, -5.5849609375, -4.14404296875, -2.703125, -1.26220703125, 0.1787109375, 1.61962890625, 3.060546875, 4.50146484375, 5.9423828125, 7.38330078125, 8.82421875, 10.26513671875, 11.7060546875, 13.14697265625, 14.587890625, 16.02880859375, 17.4697265625, 18.91064453125, 20.3515625, 21.79248046875, 23.2333984375, 24.67431640625, 26.115234375, 27.55615234375, 28.9970703125, 30.43798828125, 31.87890625, 33.31982421875, 34.7607421875, 36.20166015625, 37.642578125, 39.08349609375, 40.5244140625, 41.96533203125, 43.40625]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 6.0, 13.0, 14.0, 15.0, 24.0, 22.0, 29.0, 68.0, 121.0, 173.0, 350.0, 952.0, 8855.0, 3044388.0, 87297.0, 2198.0, 548.0, 254.0, 107.0, 75.0, 60.0, 32.0, 28.0, 20.0, 9.0, 14.0, 7.0, 4.0, 5.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-185.875, -181.1982421875, -176.521484375, -171.8447265625, -167.16796875, -162.4912109375, -157.814453125, -153.1376953125, -148.4609375, -143.7841796875, -139.107421875, -134.4306640625, -129.75390625, -125.0771484375, -120.400390625, -115.7236328125, -111.046875, -106.3701171875, -101.693359375, -97.0166015625, -92.33984375, -87.6630859375, -82.986328125, -78.3095703125, -73.6328125, -68.9560546875, -64.279296875, -59.6025390625, -54.92578125, -50.2490234375, -45.572265625, -40.8955078125, -36.21875, -31.5419921875, -26.865234375, -22.1884765625, -17.51171875, -12.8349609375, -8.158203125, -3.4814453125, 1.1953125, 5.8720703125, 10.548828125, 15.2255859375, 19.90234375, 24.5791015625, 29.255859375, 33.9326171875, 38.609375, 43.2861328125, 47.962890625, 52.6396484375, 57.31640625, 61.9931640625, 66.669921875, 71.3466796875, 76.0234375, 80.7001953125, 85.376953125, 90.0537109375, 94.73046875, 99.4072265625, 104.083984375, 108.7607421875, 113.4375]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 19.0, 679.0, 311.0, 9.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-445.6768493652344, -420.7241516113281, -395.771484375, -370.81878662109375, -345.8660888671875, -320.9134216308594, -295.9607238769531, -271.008056640625, -246.05535888671875, -221.10267639160156, -196.14999389648438, -171.19729614257812, -146.24461364746094, -121.29193115234375, -96.3392333984375, -71.38655090332031, -46.433868408203125, -21.481182098388672, 3.4715042114257812, 28.4241943359375, 53.37687683105469, 78.32955932617188, 103.28225708007812, 128.2349395751953, 153.1876220703125, 178.1403045654297, 203.09298706054688, 228.04568481445312, 252.9983673095703, 277.9510498046875, 302.90374755859375, 327.8564453125, 352.80908203125, 377.76177978515625, 402.7144470214844, 427.6671447753906, 452.61981201171875, 477.572509765625, 502.52520751953125, 527.4779052734375, 552.4305419921875, 577.3832397460938, 602.3359375, 627.28857421875, 652.2412719726562, 677.1939697265625, 702.1466674804688, 727.099365234375, 752.0520629882812, 777.0047607421875, 801.9574584960938, 826.91015625, 851.86279296875, 876.8154907226562, 901.7681884765625, 926.7208862304688, 951.673583984375, 976.6262817382812, 1001.5789794921875, 1026.5316162109375, 1051.484375, 1076.43701171875, 1101.3896484375, 1126.3424072265625, 1151.2950439453125]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 2.0, 4.0, 10.0, 4.0, 8.0, 10.0, 10.0, 26.0, 24.0, 16.0, 27.0, 38.0, 21.0, 34.0, 44.0, 43.0, 30.0, 36.0, 43.0, 43.0, 53.0, 51.0, 27.0, 52.0, 38.0, 23.0, 46.0, 38.0, 30.0, 28.0, 31.0, 20.0, 20.0, 9.0, 13.0, 14.0, 8.0, 8.0, 3.0, 4.0, 12.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.79092407226562, -101.34465789794922, -97.89839172363281, -94.4521255493164, -91.005859375, -87.5595932006836, -84.11332702636719, -80.66705322265625, -77.22079467773438, -73.77452850341797, -70.32826232910156, -66.88199615478516, -63.43572998046875, -59.989463806152344, -56.54319381713867, -53.096927642822266, -49.650657653808594, -46.20439147949219, -42.75812530517578, -39.311859130859375, -35.86559295654297, -32.41932678222656, -28.97305679321289, -25.526790618896484, -22.080524444580078, -18.634258270263672, -15.18799114227295, -11.741724014282227, -8.29545783996582, -4.849191665649414, -1.402923583984375, 2.0433425903320312, 5.4896087646484375, 8.935874938964844, 12.382142066955566, 15.828409194946289, 19.274675369262695, 22.7209415435791, 26.16720962524414, 29.613475799560547, 33.05974197387695, 36.50600814819336, 39.952274322509766, 43.39854431152344, 46.844810485839844, 50.29107666015625, 53.737342834472656, 57.18360900878906, 60.62987518310547, 64.07614135742188, 67.52240753173828, 70.96867370605469, 74.4149398803711, 77.8612060546875, 81.30747985839844, 84.75373840332031, 88.20001220703125, 91.64627838134766, 95.09254455566406, 98.53881072998047, 101.98507690429688, 105.43134307861328, 108.87760925292969, 112.32388305664062, 115.7701416015625]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 8.0, 7.0, 16.0, 10.0, 15.0, 13.0, 27.0, 27.0, 25.0, 28.0, 48.0, 43.0, 39.0, 36.0, 43.0, 40.0, 47.0, 42.0, 62.0, 47.0, 47.0, 40.0, 49.0, 37.0, 31.0, 24.0, 19.0, 21.0, 19.0, 15.0, 27.0, 14.0, 10.0, 5.0, 8.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.546875, -18.940185546875, -18.33349609375, -17.726806640625, -17.1201171875, -16.513427734375, -15.90673828125, -15.300048828125, -14.693359375, -14.086669921875, -13.47998046875, -12.873291015625, -12.2666015625, -11.659912109375, -11.05322265625, -10.446533203125, -9.83984375, -9.233154296875, -8.62646484375, -8.019775390625, -7.4130859375, -6.806396484375, -6.19970703125, -5.593017578125, -4.986328125, -4.379638671875, -3.77294921875, -3.166259765625, -2.5595703125, -1.952880859375, -1.34619140625, -0.739501953125, -0.1328125, 0.473876953125, 1.08056640625, 1.687255859375, 2.2939453125, 2.900634765625, 3.50732421875, 4.114013671875, 4.720703125, 5.327392578125, 5.93408203125, 6.540771484375, 7.1474609375, 7.754150390625, 8.36083984375, 8.967529296875, 9.57421875, 10.180908203125, 10.78759765625, 11.394287109375, 12.0009765625, 12.607666015625, 13.21435546875, 13.821044921875, 14.427734375, 15.034423828125, 15.64111328125, 16.247802734375, 16.8544921875, 17.461181640625, 18.06787109375, 18.674560546875, 19.28125]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 3.0, 3.0, 10.0, 10.0, 12.0, 21.0, 19.0, 27.0, 41.0, 44.0, 64.0, 82.0, 135.0, 178.0, 229.0, 385.0, 609.0, 1057.0, 1811.0, 3547.0, 8579.0, 35584.0, 420803.0, 2603901.0, 1001839.0, 90254.0, 14431.0, 4797.0, 2366.0, 1258.0, 763.0, 445.0, 280.0, 206.0, 151.0, 94.0, 54.0, 48.0, 32.0, 22.0, 21.0, 19.0, 16.0, 14.0, 3.0, 5.0, 6.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-33.25, -32.23291015625, -31.2158203125, -30.19873046875, -29.181640625, -28.16455078125, -27.1474609375, -26.13037109375, -25.11328125, -24.09619140625, -23.0791015625, -22.06201171875, -21.044921875, -20.02783203125, -19.0107421875, -17.99365234375, -16.9765625, -15.95947265625, -14.9423828125, -13.92529296875, -12.908203125, -11.89111328125, -10.8740234375, -9.85693359375, -8.83984375, -7.82275390625, -6.8056640625, -5.78857421875, -4.771484375, -3.75439453125, -2.7373046875, -1.72021484375, -0.703125, 0.31396484375, 1.3310546875, 2.34814453125, 3.365234375, 4.38232421875, 5.3994140625, 6.41650390625, 7.43359375, 8.45068359375, 9.4677734375, 10.48486328125, 11.501953125, 12.51904296875, 13.5361328125, 14.55322265625, 15.5703125, 16.58740234375, 17.6044921875, 18.62158203125, 19.638671875, 20.65576171875, 21.6728515625, 22.68994140625, 23.70703125, 24.72412109375, 25.7412109375, 26.75830078125, 27.775390625, 28.79248046875, 29.8095703125, 30.82666015625, 31.84375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 6.0, 3.0, 7.0, 4.0, 19.0, 11.0, 18.0, 15.0, 32.0, 38.0, 56.0, 58.0, 101.0, 140.0, 252.0, 344.0, 559.0, 680.0, 556.0, 360.0, 217.0, 171.0, 107.0, 80.0, 61.0, 49.0, 28.0, 30.0, 26.0, 14.0, 8.0, 11.0, 4.0, 5.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.484375, -25.587890625, -24.69140625, -23.794921875, -22.8984375, -22.001953125, -21.10546875, -20.208984375, -19.3125, -18.416015625, -17.51953125, -16.623046875, -15.7265625, -14.830078125, -13.93359375, -13.037109375, -12.140625, -11.244140625, -10.34765625, -9.451171875, -8.5546875, -7.658203125, -6.76171875, -5.865234375, -4.96875, -4.072265625, -3.17578125, -2.279296875, -1.3828125, -0.486328125, 0.41015625, 1.306640625, 2.203125, 3.099609375, 3.99609375, 4.892578125, 5.7890625, 6.685546875, 7.58203125, 8.478515625, 9.375, 10.271484375, 11.16796875, 12.064453125, 12.9609375, 13.857421875, 14.75390625, 15.650390625, 16.546875, 17.443359375, 18.33984375, 19.236328125, 20.1328125, 21.029296875, 21.92578125, 22.822265625, 23.71875, 24.615234375, 25.51171875, 26.408203125, 27.3046875, 28.201171875, 29.09765625, 29.994140625, 30.890625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 8.0, 7.0, 12.0, 27.0, 28.0, 42.0, 76.0, 93.0, 147.0, 253.0, 466.0, 841.0, 1858.0, 4249.0, 11680.0, 40257.0, 203027.0, 2722548.0, 1058032.0, 110509.0, 25680.0, 8228.0, 3176.0, 1335.0, 707.0, 368.0, 238.0, 138.0, 73.0, 56.0, 46.0, 25.0, 17.0, 11.0, 5.0, 11.0, 3.0, 7.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.8125, -36.69482421875, -35.5771484375, -34.45947265625, -33.341796875, -32.22412109375, -31.1064453125, -29.98876953125, -28.87109375, -27.75341796875, -26.6357421875, -25.51806640625, -24.400390625, -23.28271484375, -22.1650390625, -21.04736328125, -19.9296875, -18.81201171875, -17.6943359375, -16.57666015625, -15.458984375, -14.34130859375, -13.2236328125, -12.10595703125, -10.98828125, -9.87060546875, -8.7529296875, -7.63525390625, -6.517578125, -5.39990234375, -4.2822265625, -3.16455078125, -2.046875, -0.92919921875, 0.1884765625, 1.30615234375, 2.423828125, 3.54150390625, 4.6591796875, 5.77685546875, 6.89453125, 8.01220703125, 9.1298828125, 10.24755859375, 11.365234375, 12.48291015625, 13.6005859375, 14.71826171875, 15.8359375, 16.95361328125, 18.0712890625, 19.18896484375, 20.306640625, 21.42431640625, 22.5419921875, 23.65966796875, 24.77734375, 25.89501953125, 27.0126953125, 28.13037109375, 29.248046875, 30.36572265625, 31.4833984375, 32.60107421875, 33.71875]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 17.0, 76.0, 195.0, 324.0, 264.0, 88.0, 33.0, 8.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-118.43685913085938, -109.78137969970703, -101.12590026855469, -92.47042083740234, -83.81494140625, -75.15946197509766, -66.50398254394531, -57.84850311279297, -49.193023681640625, -40.53754425048828, -31.882064819335938, -23.226585388183594, -14.57110595703125, -5.915626525878906, 2.7398529052734375, 11.395332336425781, 20.050811767578125, 28.70629119873047, 37.36177062988281, 46.017250061035156, 54.6727294921875, 63.328208923339844, 71.98368835449219, 80.63916778564453, 89.29464721679688, 97.95012664794922, 106.60560607910156, 115.2610855102539, 123.91656494140625, 132.57205200195312, 141.22752380371094, 149.88299560546875, 158.53848266601562, 167.1939697265625, 175.8494415283203, 184.50491333007812, 193.160400390625, 201.81588745117188, 210.4713592529297, 219.1268310546875, 227.78231811523438, 236.43780517578125, 245.09327697753906, 253.74874877929688, 262.40423583984375, 271.0597229003906, 279.7152099609375, 288.37066650390625, 297.0261535644531, 305.681640625, 314.33709716796875, 322.9925842285156, 331.6480712890625, 340.3035583496094, 348.95904541015625, 357.614501953125, 366.2699890136719, 374.92547607421875, 383.5809326171875, 392.2364196777344, 400.89190673828125, 409.5473937988281, 418.202880859375, 426.85833740234375, 435.5138244628906]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 8.0, 5.0, 6.0, 12.0, 9.0, 12.0, 9.0, 18.0, 25.0, 27.0, 24.0, 29.0, 39.0, 35.0, 30.0, 25.0, 46.0, 37.0, 52.0, 48.0, 47.0, 28.0, 43.0, 48.0, 41.0, 41.0, 34.0, 38.0, 26.0, 27.0, 27.0, 24.0, 12.0, 11.0, 11.0, 14.0, 9.0, 6.0, 5.0, 3.0, 8.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-101.22217559814453, -98.37931060791016, -95.53643798828125, -92.69357299804688, -89.8507080078125, -87.0078353881836, -84.16497039794922, -81.32209777832031, -78.47923278808594, -75.63636779785156, -72.79349517822266, -69.95063018798828, -67.10775756835938, -64.264892578125, -61.422027587890625, -58.579158782958984, -55.736289978027344, -52.8934211730957, -50.05055236816406, -47.20768737792969, -44.36481857299805, -41.521949768066406, -38.67908477783203, -35.83621597290039, -32.99334716796875, -30.15047836303711, -27.3076114654541, -24.464744567871094, -21.621875762939453, -18.779006958007812, -15.936140060424805, -13.093273162841797, -10.250411987304688, -7.407544136047363, -4.564676284790039, -1.7218084335327148, 1.1210594177246094, 3.9639272689819336, 6.806795120239258, 9.649662017822266, 12.492530822753906, 15.33539867401123, 18.178266525268555, 21.021133422851562, 23.864002227783203, 26.706871032714844, 29.54973793029785, 32.39260482788086, 35.2354736328125, 38.07834243774414, 40.92121124267578, 43.764076232910156, 46.6069450378418, 49.44981384277344, 52.29267883300781, 55.13554763793945, 57.978416442871094, 60.821285247802734, 63.664154052734375, 66.50701904296875, 69.34988403320312, 72.19275665283203, 75.0356216430664, 77.87849426269531, 80.72135925292969]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 3.0, 9.0, 3.0, 8.0, 10.0, 14.0, 11.0, 13.0, 21.0, 23.0, 24.0, 23.0, 31.0, 29.0, 47.0, 44.0, 47.0, 26.0, 41.0, 61.0, 45.0, 42.0, 45.0, 42.0, 30.0, 40.0, 39.0, 45.0, 28.0, 30.0, 25.0, 16.0, 18.0, 11.0, 13.0, 11.0, 9.0, 6.0, 7.0, 7.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8828125, -12.4093017578125, -11.935791015625, -11.4622802734375, -10.98876953125, -10.5152587890625, -10.041748046875, -9.5682373046875, -9.0947265625, -8.6212158203125, -8.147705078125, -7.6741943359375, -7.20068359375, -6.7271728515625, -6.253662109375, -5.7801513671875, -5.306640625, -4.8331298828125, -4.359619140625, -3.8861083984375, -3.41259765625, -2.9390869140625, -2.465576171875, -1.9920654296875, -1.5185546875, -1.0450439453125, -0.571533203125, -0.0980224609375, 0.37548828125, 0.8489990234375, 1.322509765625, 1.7960205078125, 2.26953125, 2.7430419921875, 3.216552734375, 3.6900634765625, 4.16357421875, 4.6370849609375, 5.110595703125, 5.5841064453125, 6.0576171875, 6.5311279296875, 7.004638671875, 7.4781494140625, 7.95166015625, 8.4251708984375, 8.898681640625, 9.3721923828125, 9.845703125, 10.3192138671875, 10.792724609375, 11.2662353515625, 11.73974609375, 12.2132568359375, 12.686767578125, 13.1602783203125, 13.6337890625, 14.1072998046875, 14.580810546875, 15.0543212890625, 15.52783203125, 16.0013427734375, 16.474853515625, 16.9483642578125, 17.421875]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 8.0, 8.0, 16.0, 29.0, 30.0, 56.0, 84.0, 125.0, 224.0, 343.0, 479.0, 799.0, 1317.0, 2047.0, 3425.0, 5521.0, 9574.0, 16255.0, 28500.0, 50813.0, 93144.0, 173349.0, 270769.0, 175473.0, 94733.0, 51388.0, 28861.0, 16646.0, 9700.0, 5720.0, 3547.0, 2072.0, 1312.0, 800.0, 498.0, 303.0, 218.0, 139.0, 73.0, 53.0, 32.0, 23.0, 22.0, 8.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.309814453125, -0.30028533935546875, -0.2907562255859375, -0.28122711181640625, -0.271697998046875, -0.26216888427734375, -0.2526397705078125, -0.24311065673828125, -0.23358154296875, -0.22405242919921875, -0.2145233154296875, -0.20499420166015625, -0.195465087890625, -0.18593597412109375, -0.1764068603515625, -0.16687774658203125, -0.1573486328125, -0.14781951904296875, -0.1382904052734375, -0.12876129150390625, -0.119232177734375, -0.10970306396484375, -0.1001739501953125, -0.09064483642578125, -0.08111572265625, -0.07158660888671875, -0.0620574951171875, -0.05252838134765625, -0.042999267578125, -0.03347015380859375, -0.0239410400390625, -0.01441192626953125, -0.0048828125, 0.00464630126953125, 0.0141754150390625, 0.02370452880859375, 0.033233642578125, 0.04276275634765625, 0.0522918701171875, 0.06182098388671875, 0.07135009765625, 0.08087921142578125, 0.0904083251953125, 0.09993743896484375, 0.109466552734375, 0.11899566650390625, 0.1285247802734375, 0.13805389404296875, 0.1475830078125, 0.15711212158203125, 0.1666412353515625, 0.17617034912109375, 0.185699462890625, 0.19522857666015625, 0.2047576904296875, 0.21428680419921875, 0.22381591796875, 0.23334503173828125, 0.2428741455078125, 0.25240325927734375, 0.261932373046875, 0.27146148681640625, 0.2809906005859375, 0.29051971435546875, 0.300048828125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 4.0, 10.0, 11.0, 10.0, 14.0, 10.0, 18.0, 22.0, 19.0, 20.0, 38.0, 37.0, 34.0, 34.0, 34.0, 34.0, 35.0, 35.0, 44.0, 1070.0, 45.0, 46.0, 44.0, 55.0, 37.0, 36.0, 24.0, 22.0, 30.0, 31.0, 13.0, 21.0, 13.0, 18.0, 18.0, 15.0, 6.0, 9.0, 3.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3046875, -7.998291015625, -7.69189453125, -7.385498046875, -7.0791015625, -6.772705078125, -6.46630859375, -6.159912109375, -5.853515625, -5.547119140625, -5.24072265625, -4.934326171875, -4.6279296875, -4.321533203125, -4.01513671875, -3.708740234375, -3.40234375, -3.095947265625, -2.78955078125, -2.483154296875, -2.1767578125, -1.870361328125, -1.56396484375, -1.257568359375, -0.951171875, -0.644775390625, -0.33837890625, -0.031982421875, 0.2744140625, 0.580810546875, 0.88720703125, 1.193603515625, 1.5, 1.806396484375, 2.11279296875, 2.419189453125, 2.7255859375, 3.031982421875, 3.33837890625, 3.644775390625, 3.951171875, 4.257568359375, 4.56396484375, 4.870361328125, 5.1767578125, 5.483154296875, 5.78955078125, 6.095947265625, 6.40234375, 6.708740234375, 7.01513671875, 7.321533203125, 7.6279296875, 7.934326171875, 8.24072265625, 8.547119140625, 8.853515625, 9.159912109375, 9.46630859375, 9.772705078125, 10.0791015625, 10.385498046875, 10.69189453125, 10.998291015625, 11.3046875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 8.0, 6.0, 16.0, 24.0, 25.0, 50.0, 64.0, 104.0, 145.0, 231.0, 342.0, 564.0, 772.0, 1160.0, 1711.0, 2705.0, 4252.0, 6413.0, 9911.0, 15485.0, 24226.0, 38638.0, 62463.0, 104673.0, 183509.0, 1280242.0, 140935.0, 81960.0, 49974.0, 31659.0, 19523.0, 12292.0, 7853.0, 5103.0, 3490.0, 2197.0, 1482.0, 947.0, 650.0, 437.0, 316.0, 180.0, 123.0, 97.0, 58.0, 44.0, 30.0, 15.0, 15.0, 4.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.149658203125, -0.14487266540527344, -0.14008712768554688, -0.1353015899658203, -0.13051605224609375, -0.1257305145263672, -0.12094497680664062, -0.11615943908691406, -0.1113739013671875, -0.10658836364746094, -0.10180282592773438, -0.09701728820800781, -0.09223175048828125, -0.08744621276855469, -0.08266067504882812, -0.07787513732910156, -0.073089599609375, -0.06830406188964844, -0.06351852416992188, -0.05873298645019531, -0.05394744873046875, -0.04916191101074219, -0.044376373291015625, -0.03959083557128906, -0.0348052978515625, -0.030019760131835938, -0.025234222412109375, -0.020448684692382812, -0.01566314697265625, -0.010877609252929688, -0.006092071533203125, -0.0013065338134765625, 0.00347900390625, 0.008264541625976562, 0.013050079345703125, 0.017835617065429688, 0.02262115478515625, 0.027406692504882812, 0.032192230224609375, 0.03697776794433594, 0.0417633056640625, 0.04654884338378906, 0.051334381103515625, 0.05611991882324219, 0.06090545654296875, 0.06569099426269531, 0.07047653198242188, 0.07526206970214844, 0.080047607421875, 0.08483314514160156, 0.08961868286132812, 0.09440422058105469, 0.09918975830078125, 0.10397529602050781, 0.10876083374023438, 0.11354637145996094, 0.1183319091796875, 0.12311744689941406, 0.12790298461914062, 0.1326885223388672, 0.13747406005859375, 0.1422595977783203, 0.14704513549804688, 0.15183067321777344, 0.1566162109375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 2.0, 7.0, 6.0, 3.0, 9.0, 4.0, 9.0, 16.0, 17.0, 22.0, 31.0, 18.0, 25.0, 29.0, 36.0, 33.0, 40.0, 51.0, 80.0, 87.0, 91.0, 63.0, 54.0, 36.0, 25.0, 37.0, 27.0, 28.0, 19.0, 21.0, 10.0, 5.0, 5.0, 5.0, 9.0, 6.0, 6.0, 7.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.00025081634521484375, -0.00024335645139217377, -0.00023589655756950378, -0.0002284366637468338, -0.00022097676992416382, -0.00021351687610149384, -0.00020605698227882385, -0.00019859708845615387, -0.0001911371946334839, -0.0001836773008108139, -0.00017621740698814392, -0.00016875751316547394, -0.00016129761934280396, -0.00015383772552013397, -0.000146377831697464, -0.000138917937874794, -0.00013145804405212402, -0.00012399815022945404, -0.00011653825640678406, -0.00010907836258411407, -0.00010161846876144409, -9.415857493877411e-05, -8.669868111610413e-05, -7.923878729343414e-05, -7.177889347076416e-05, -6.431899964809418e-05, -5.6859105825424194e-05, -4.939921200275421e-05, -4.193931818008423e-05, -3.4479424357414246e-05, -2.7019530534744263e-05, -1.955963671207428e-05, -1.2099742889404297e-05, -4.639849066734314e-06, 2.820044755935669e-06, 1.0279938578605652e-05, 1.7739832401275635e-05, 2.5199726223945618e-05, 3.26596200466156e-05, 4.0119513869285583e-05, 4.7579407691955566e-05, 5.503930151462555e-05, 6.249919533729553e-05, 6.995908915996552e-05, 7.74189829826355e-05, 8.487887680530548e-05, 9.233877062797546e-05, 9.979866445064545e-05, 0.00010725855827331543, 0.00011471845209598541, 0.0001221783459186554, 0.00012963823974132538, 0.00013709813356399536, 0.00014455802738666534, 0.00015201792120933533, 0.0001594778150320053, 0.0001669377088546753, 0.00017439760267734528, 0.00018185749650001526, 0.00018931739032268524, 0.00019677728414535522, 0.0002042371779680252, 0.0002116970717906952, 0.00021915696561336517, 0.00022661685943603516]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 5.0, 7.0, 11.0, 7.0, 11.0, 7.0, 12.0, 18.0, 28.0, 41.0, 38.0, 42.0, 96.0, 121.0, 180.0, 361.0, 854.0, 59077.0, 984710.0, 1652.0, 479.0, 230.0, 133.0, 99.0, 81.0, 39.0, 36.0, 34.0, 33.0, 24.0, 18.0, 9.0, 9.0, 9.0, 5.0, 5.0, 6.0, 5.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0054473876953125, -0.00527268648147583, -0.00509798526763916, -0.00492328405380249, -0.00474858283996582, -0.00457388162612915, -0.0043991804122924805, -0.0042244791984558105, -0.004049777984619141, -0.0038750767707824707, -0.0037003755569458008, -0.003525674343109131, -0.003350973129272461, -0.003176271915435791, -0.003001570701599121, -0.002826869487762451, -0.0026521682739257812, -0.0024774670600891113, -0.0023027658462524414, -0.0021280646324157715, -0.0019533634185791016, -0.0017786622047424316, -0.0016039609909057617, -0.0014292597770690918, -0.0012545585632324219, -0.001079857349395752, -0.000905156135559082, -0.0007304549217224121, -0.0005557537078857422, -0.00038105249404907227, -0.00020635128021240234, -3.165006637573242e-05, 0.0001430511474609375, 0.0003177523612976074, 0.0004924535751342773, 0.0006671547889709473, 0.0008418560028076172, 0.0010165572166442871, 0.001191258430480957, 0.001365959644317627, 0.0015406608581542969, 0.0017153620719909668, 0.0018900632858276367, 0.0020647644996643066, 0.0022394657135009766, 0.0024141669273376465, 0.0025888681411743164, 0.0027635693550109863, 0.0029382705688476562, 0.003112971782684326, 0.003287672996520996, 0.003462374210357666, 0.003637075424194336, 0.003811776638031006, 0.003986477851867676, 0.004161179065704346, 0.004335880279541016, 0.0045105814933776855, 0.0046852827072143555, 0.004859983921051025, 0.005034685134887695, 0.005209386348724365, 0.005384087562561035, 0.005558788776397705, 0.005733489990234375]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 762.0, 253.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008890714962035418, -0.0006648646667599678, -0.00044065777910873294, -0.00021645089145749807, 7.755937986075878e-06, 0.00023196276742964983, 0.0004561697132885456, 0.0006803765427321196, 0.0009045833721756935, 0.0011287902016192675, 0.0013529970310628414, 0.0015772039769217372, 0.0018014108063653111, 0.002025617752224207, 0.002249824581667781, 0.002474031411111355, 0.0026982382405549288, 0.0029224450699985027, 0.0031466518994420767, 0.0033708587288856506, 0.0035950657911598682, 0.0038192723877727985, 0.004043479450047016, 0.0042676860466599464, 0.004491893108934164, 0.004716100171208382, 0.004940306767821312, 0.0051645138300955296, 0.00538872042670846, 0.0056129274889826775, 0.005837134085595608, 0.006061341147869825, 0.006285548210144043, 0.006509755272418261, 0.006733961869031191, 0.0069581689313054085, 0.007182375527918339, 0.007406582590192556, 0.007630789652466774, 0.007854996249079704, 0.008079202845692635, 0.008303409442305565, 0.00852761697024107, 0.008751823566854, 0.00897603016346693, 0.00920023676007986, 0.009424444288015366, 0.009648650884628296, 0.009872857481241226, 0.010097064077854156, 0.010321271605789661, 0.010545478202402592, 0.010769684799015522, 0.010993891395628452, 0.011218098923563957, 0.011442305520176888, 0.011666513048112392, 0.011890719644725323, 0.012114927172660828, 0.012339133769273758, 0.012563340365886688, 0.012787546962499619, 0.013011754490435123, 0.013235961087048054, 0.013460167683660984]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 9.0, 8.0, 36.0, 55.0, 79.0, 122.0, 148.0, 142.0, 129.0, 116.0, 69.0, 51.0, 32.0, 13.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005792379379272461, -0.0005623642355203629, -0.0005454905331134796, -0.0005286168307065964, -0.0005117431282997131, -0.0004948694258928299, -0.00047799572348594666, -0.0004611220210790634, -0.0004442483186721802, -0.00042737461626529694, -0.0004105009138584137, -0.00039362721145153046, -0.0003767535090446472, -0.000359879806637764, -0.00034300610423088074, -0.0003261324018239975, -0.00030925869941711426, -0.000292384997010231, -0.0002755112946033478, -0.00025863759219646454, -0.0002417638897895813, -0.00022489018738269806, -0.00020801648497581482, -0.00019114278256893158, -0.00017426908016204834, -0.0001573953777551651, -0.00014052167534828186, -0.00012364797294139862, -0.00010677427053451538, -8.990056812763214e-05, -7.30268657207489e-05, -5.615316331386566e-05, -3.927946090698242e-05, -2.2405758500099182e-05, -5.532056093215942e-06, 1.1341646313667297e-05, 2.8215348720550537e-05, 4.508905112743378e-05, 6.196275353431702e-05, 7.883645594120026e-05, 9.57101583480835e-05, 0.00011258386075496674, 0.00012945756316184998, 0.00014633126556873322, 0.00016320496797561646, 0.0001800786703824997, 0.00019695237278938293, 0.00021382607519626617, 0.00023069977760314941, 0.00024757348001003265, 0.0002644471824169159, 0.00028132088482379913, 0.0002981945872306824, 0.0003150682896375656, 0.00033194199204444885, 0.0003488156944513321, 0.00036568939685821533, 0.00038256309926509857, 0.0003994368016719818, 0.00041631050407886505, 0.0004331842064857483, 0.00045005790889263153, 0.00046693161129951477, 0.000483805313706398, 0.0005006790161132812]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 3.0, 9.0, 3.0, 8.0, 10.0, 14.0, 11.0, 13.0, 21.0, 23.0, 24.0, 23.0, 31.0, 29.0, 47.0, 44.0, 47.0, 26.0, 41.0, 61.0, 45.0, 42.0, 45.0, 42.0, 30.0, 40.0, 39.0, 45.0, 28.0, 30.0, 25.0, 16.0, 18.0, 11.0, 13.0, 11.0, 9.0, 6.0, 7.0, 7.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8828125, -12.4093017578125, -11.935791015625, -11.4622802734375, -10.98876953125, -10.5152587890625, -10.041748046875, -9.5682373046875, -9.0947265625, -8.6212158203125, -8.147705078125, -7.6741943359375, -7.20068359375, -6.7271728515625, -6.253662109375, -5.7801513671875, -5.306640625, -4.8331298828125, -4.359619140625, -3.8861083984375, -3.41259765625, -2.9390869140625, -2.465576171875, -1.9920654296875, -1.5185546875, -1.0450439453125, -0.571533203125, -0.0980224609375, 0.37548828125, 0.8489990234375, 1.322509765625, 1.7960205078125, 2.26953125, 2.7430419921875, 3.216552734375, 3.6900634765625, 4.16357421875, 4.6370849609375, 5.110595703125, 5.5841064453125, 6.0576171875, 6.5311279296875, 7.004638671875, 7.4781494140625, 7.95166015625, 8.4251708984375, 8.898681640625, 9.3721923828125, 9.845703125, 10.3192138671875, 10.792724609375, 11.2662353515625, 11.73974609375, 12.2132568359375, 12.686767578125, 13.1602783203125, 13.6337890625, 14.1072998046875, 14.580810546875, 15.0543212890625, 15.52783203125, 16.0013427734375, 16.474853515625, 16.9483642578125, 17.421875]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 2.0, 4.0, 12.0, 3.0, 27.0, 24.0, 40.0, 42.0, 73.0, 108.0, 157.0, 227.0, 346.0, 516.0, 763.0, 1288.0, 2206.0, 3845.0, 7485.0, 16790.0, 50815.0, 253627.0, 555553.0, 103706.0, 27556.0, 10792.0, 5174.0, 2746.0, 1621.0, 1021.0, 640.0, 457.0, 274.0, 187.0, 133.0, 85.0, 73.0, 45.0, 30.0, 19.0, 14.0, 6.0, 10.0, 6.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.09375, -25.308837890625, -24.52392578125, -23.739013671875, -22.9541015625, -22.169189453125, -21.38427734375, -20.599365234375, -19.814453125, -19.029541015625, -18.24462890625, -17.459716796875, -16.6748046875, -15.889892578125, -15.10498046875, -14.320068359375, -13.53515625, -12.750244140625, -11.96533203125, -11.180419921875, -10.3955078125, -9.610595703125, -8.82568359375, -8.040771484375, -7.255859375, -6.470947265625, -5.68603515625, -4.901123046875, -4.1162109375, -3.331298828125, -2.54638671875, -1.761474609375, -0.9765625, -0.191650390625, 0.59326171875, 1.378173828125, 2.1630859375, 2.947998046875, 3.73291015625, 4.517822265625, 5.302734375, 6.087646484375, 6.87255859375, 7.657470703125, 8.4423828125, 9.227294921875, 10.01220703125, 10.797119140625, 11.58203125, 12.366943359375, 13.15185546875, 13.936767578125, 14.7216796875, 15.506591796875, 16.29150390625, 17.076416015625, 17.861328125, 18.646240234375, 19.43115234375, 20.216064453125, 21.0009765625, 21.785888671875, 22.57080078125, 23.355712890625, 24.140625]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 3.0, 3.0, 6.0, 6.0, 6.0, 6.0, 11.0, 8.0, 13.0, 16.0, 23.0, 15.0, 23.0, 33.0, 23.0, 40.0, 42.0, 43.0, 78.0, 71.0, 204.0, 1592.0, 278.0, 96.0, 64.0, 50.0, 41.0, 33.0, 38.0, 32.0, 37.0, 22.0, 12.0, 20.0, 12.0, 11.0, 13.0, 5.0, 4.0, 5.0, 6.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0], "bins": [-42.125, -41.035400390625, -39.94580078125, -38.856201171875, -37.7666015625, -36.677001953125, -35.58740234375, -34.497802734375, -33.408203125, -32.318603515625, -31.22900390625, -30.139404296875, -29.0498046875, -27.960205078125, -26.87060546875, -25.781005859375, -24.69140625, -23.601806640625, -22.51220703125, -21.422607421875, -20.3330078125, -19.243408203125, -18.15380859375, -17.064208984375, -15.974609375, -14.885009765625, -13.79541015625, -12.705810546875, -11.6162109375, -10.526611328125, -9.43701171875, -8.347412109375, -7.2578125, -6.168212890625, -5.07861328125, -3.989013671875, -2.8994140625, -1.809814453125, -0.72021484375, 0.369384765625, 1.458984375, 2.548583984375, 3.63818359375, 4.727783203125, 5.8173828125, 6.906982421875, 7.99658203125, 9.086181640625, 10.17578125, 11.265380859375, 12.35498046875, 13.444580078125, 14.5341796875, 15.623779296875, 16.71337890625, 17.802978515625, 18.892578125, 19.982177734375, 21.07177734375, 22.161376953125, 23.2509765625, 24.340576171875, 25.43017578125, 26.519775390625, 27.609375]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 7.0, 12.0, 12.0, 13.0, 15.0, 29.0, 36.0, 57.0, 66.0, 108.0, 147.0, 261.0, 468.0, 1336.0, 13897.0, 3086227.0, 39530.0, 2045.0, 553.0, 316.0, 168.0, 113.0, 88.0, 55.0, 38.0, 26.0, 16.0, 14.0, 16.0, 12.0, 10.0, 2.0, 6.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-100.25, -97.3544921875, -94.458984375, -91.5634765625, -88.66796875, -85.7724609375, -82.876953125, -79.9814453125, -77.0859375, -74.1904296875, -71.294921875, -68.3994140625, -65.50390625, -62.6083984375, -59.712890625, -56.8173828125, -53.921875, -51.0263671875, -48.130859375, -45.2353515625, -42.33984375, -39.4443359375, -36.548828125, -33.6533203125, -30.7578125, -27.8623046875, -24.966796875, -22.0712890625, -19.17578125, -16.2802734375, -13.384765625, -10.4892578125, -7.59375, -4.6982421875, -1.802734375, 1.0927734375, 3.98828125, 6.8837890625, 9.779296875, 12.6748046875, 15.5703125, 18.4658203125, 21.361328125, 24.2568359375, 27.15234375, 30.0478515625, 32.943359375, 35.8388671875, 38.734375, 41.6298828125, 44.525390625, 47.4208984375, 50.31640625, 53.2119140625, 56.107421875, 59.0029296875, 61.8984375, 64.7939453125, 67.689453125, 70.5849609375, 73.48046875, 76.3759765625, 79.271484375, 82.1669921875, 85.0625]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 8.0, 8.0, 33.0, 63.0, 120.0, 201.0, 241.0, 152.0, 85.0, 51.0, 19.0, 13.0, 10.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.17568969726562, -95.25472259521484, -91.33375549316406, -87.41278839111328, -83.4918212890625, -79.57085418701172, -75.64988708496094, -71.72892761230469, -67.80795288085938, -63.886985778808594, -59.96601867675781, -56.04505157470703, -52.12408447265625, -48.20311737060547, -44.28215408325195, -40.36118698120117, -36.440223693847656, -32.519256591796875, -28.598289489746094, -24.677324295043945, -20.756357192993164, -16.835390090942383, -12.914424896240234, -8.993457794189453, -5.072490692138672, -1.1515240669250488, 2.769442558288574, 6.690408706665039, 10.61137580871582, 14.532342910766602, 18.45330810546875, 22.37427520751953, 26.295242309570312, 30.216209411621094, 34.137176513671875, 38.058143615722656, 41.97911071777344, 45.90007781982422, 49.821041107177734, 53.742008209228516, 57.6629753112793, 61.58394241333008, 65.5049057006836, 69.42587280273438, 73.34683990478516, 77.26780700683594, 81.18877410888672, 85.1097412109375, 89.03070831298828, 92.95167541503906, 96.87264251708984, 100.79360961914062, 104.7145767211914, 108.63554382324219, 112.55650329589844, 116.47747802734375, 120.3984375, 124.31940460205078, 128.24037170410156, 132.1613311767578, 136.08230590820312, 140.00326538085938, 143.9242401123047, 147.84519958496094, 151.76617431640625]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 3.0, 6.0, 6.0, 7.0, 10.0, 9.0, 8.0, 10.0, 7.0, 13.0, 6.0, 24.0, 22.0, 20.0, 37.0, 43.0, 33.0, 38.0, 34.0, 33.0, 47.0, 56.0, 41.0, 48.0, 44.0, 44.0, 39.0, 48.0, 41.0, 28.0, 24.0, 30.0, 27.0, 18.0, 18.0, 15.0, 15.0, 11.0, 12.0, 8.0, 8.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-102.04652404785156, -98.91427612304688, -95.78202819824219, -92.6497802734375, -89.51753234863281, -86.38528442382812, -83.25303649902344, -80.12078094482422, -76.98853302001953, -73.85628509521484, -70.72403717041016, -67.59178924560547, -64.45954132080078, -61.32728958129883, -58.19504165649414, -55.06278991699219, -51.930545806884766, -48.79829788208008, -45.66604995727539, -42.53379821777344, -39.40155029296875, -36.26930236816406, -33.137054443359375, -30.004804611206055, -26.872556686401367, -23.74030876159668, -20.60805892944336, -17.475811004638672, -14.343562126159668, -11.211313247680664, -8.079065322875977, -4.946815490722656, -1.8145675659179688, 1.317681074142456, 4.449929714202881, 7.582178115844727, 10.71442699432373, 13.846675872802734, 16.978923797607422, 20.111173629760742, 23.24342155456543, 26.375669479370117, 29.507919311523438, 32.640167236328125, 35.77241516113281, 38.9046630859375, 42.03691101074219, 45.16916275024414, 48.30141067504883, 51.433658599853516, 54.5659065246582, 57.698158264160156, 60.830406188964844, 63.96265411376953, 67.09490203857422, 70.2271499633789, 73.3593978881836, 76.49164581298828, 79.62389373779297, 82.75614166259766, 85.88838958740234, 89.02064514160156, 92.15289306640625, 95.28514099121094, 98.41738891601562]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 4.0, 3.0, 7.0, 2.0, 14.0, 11.0, 11.0, 24.0, 29.0, 23.0, 23.0, 23.0, 41.0, 31.0, 38.0, 39.0, 35.0, 42.0, 61.0, 34.0, 46.0, 57.0, 51.0, 40.0, 39.0, 45.0, 34.0, 37.0, 29.0, 16.0, 27.0, 19.0, 17.0, 7.0, 9.0, 7.0, 4.0, 12.0, 6.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.7890625, -14.2735595703125, -13.758056640625, -13.2425537109375, -12.72705078125, -12.2115478515625, -11.696044921875, -11.1805419921875, -10.6650390625, -10.1495361328125, -9.634033203125, -9.1185302734375, -8.60302734375, -8.0875244140625, -7.572021484375, -7.0565185546875, -6.541015625, -6.0255126953125, -5.510009765625, -4.9945068359375, -4.47900390625, -3.9635009765625, -3.447998046875, -2.9324951171875, -2.4169921875, -1.9014892578125, -1.385986328125, -0.8704833984375, -0.35498046875, 0.1605224609375, 0.676025390625, 1.1915283203125, 1.70703125, 2.2225341796875, 2.738037109375, 3.2535400390625, 3.76904296875, 4.2845458984375, 4.800048828125, 5.3155517578125, 5.8310546875, 6.3465576171875, 6.862060546875, 7.3775634765625, 7.89306640625, 8.4085693359375, 8.924072265625, 9.4395751953125, 9.955078125, 10.4705810546875, 10.986083984375, 11.5015869140625, 12.01708984375, 12.5325927734375, 13.048095703125, 13.5635986328125, 14.0791015625, 14.5946044921875, 15.110107421875, 15.6256103515625, 16.14111328125, 16.6566162109375, 17.172119140625, 17.6876220703125, 18.203125]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 6.0, 8.0, 5.0, 9.0, 15.0, 31.0, 21.0, 46.0, 68.0, 83.0, 107.0, 141.0, 226.0, 314.0, 407.0, 634.0, 917.0, 1403.0, 2312.0, 4623.0, 14202.0, 134669.0, 1975508.0, 1892413.0, 140661.0, 14063.0, 4569.0, 2373.0, 1411.0, 961.0, 622.0, 435.0, 321.0, 217.0, 134.0, 105.0, 75.0, 39.0, 44.0, 24.0, 23.0, 16.0, 8.0, 7.0, 7.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-35.53125, -34.544189453125, -33.55712890625, -32.570068359375, -31.5830078125, -30.595947265625, -29.60888671875, -28.621826171875, -27.634765625, -26.647705078125, -25.66064453125, -24.673583984375, -23.6865234375, -22.699462890625, -21.71240234375, -20.725341796875, -19.73828125, -18.751220703125, -17.76416015625, -16.777099609375, -15.7900390625, -14.802978515625, -13.81591796875, -12.828857421875, -11.841796875, -10.854736328125, -9.86767578125, -8.880615234375, -7.8935546875, -6.906494140625, -5.91943359375, -4.932373046875, -3.9453125, -2.958251953125, -1.97119140625, -0.984130859375, 0.0029296875, 0.989990234375, 1.97705078125, 2.964111328125, 3.951171875, 4.938232421875, 5.92529296875, 6.912353515625, 7.8994140625, 8.886474609375, 9.87353515625, 10.860595703125, 11.84765625, 12.834716796875, 13.82177734375, 14.808837890625, 15.7958984375, 16.782958984375, 17.77001953125, 18.757080078125, 19.744140625, 20.731201171875, 21.71826171875, 22.705322265625, 23.6923828125, 24.679443359375, 25.66650390625, 26.653564453125, 27.640625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 4.0, 5.0, 3.0, 12.0, 14.0, 27.0, 29.0, 52.0, 92.0, 102.0, 197.0, 311.0, 586.0, 864.0, 771.0, 417.0, 226.0, 140.0, 77.0, 46.0, 35.0, 22.0, 24.0, 8.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.828125, -22.825927734375, -21.82373046875, -20.821533203125, -19.8193359375, -18.817138671875, -17.81494140625, -16.812744140625, -15.810546875, -14.808349609375, -13.80615234375, -12.803955078125, -11.8017578125, -10.799560546875, -9.79736328125, -8.795166015625, -7.79296875, -6.790771484375, -5.78857421875, -4.786376953125, -3.7841796875, -2.781982421875, -1.77978515625, -0.777587890625, 0.224609375, 1.226806640625, 2.22900390625, 3.231201171875, 4.2333984375, 5.235595703125, 6.23779296875, 7.239990234375, 8.2421875, 9.244384765625, 10.24658203125, 11.248779296875, 12.2509765625, 13.253173828125, 14.25537109375, 15.257568359375, 16.259765625, 17.261962890625, 18.26416015625, 19.266357421875, 20.2685546875, 21.270751953125, 22.27294921875, 23.275146484375, 24.27734375, 25.279541015625, 26.28173828125, 27.283935546875, 28.2861328125, 29.288330078125, 30.29052734375, 31.292724609375, 32.294921875, 33.297119140625, 34.29931640625, 35.301513671875, 36.3037109375, 37.305908203125, 38.30810546875, 39.310302734375, 40.3125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 7.0, 6.0, 24.0, 29.0, 42.0, 65.0, 136.0, 271.0, 754.0, 3018.0, 25459.0, 2422307.0, 1715122.0, 22746.0, 2814.0, 803.0, 314.0, 150.0, 80.0, 47.0, 32.0, 21.0, 8.0, 13.0, 10.0, 3.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-78.3125, -76.4013671875, -74.490234375, -72.5791015625, -70.66796875, -68.7568359375, -66.845703125, -64.9345703125, -63.0234375, -61.1123046875, -59.201171875, -57.2900390625, -55.37890625, -53.4677734375, -51.556640625, -49.6455078125, -47.734375, -45.8232421875, -43.912109375, -42.0009765625, -40.08984375, -38.1787109375, -36.267578125, -34.3564453125, -32.4453125, -30.5341796875, -28.623046875, -26.7119140625, -24.80078125, -22.8896484375, -20.978515625, -19.0673828125, -17.15625, -15.2451171875, -13.333984375, -11.4228515625, -9.51171875, -7.6005859375, -5.689453125, -3.7783203125, -1.8671875, 0.0439453125, 1.955078125, 3.8662109375, 5.77734375, 7.6884765625, 9.599609375, 11.5107421875, 13.421875, 15.3330078125, 17.244140625, 19.1552734375, 21.06640625, 22.9775390625, 24.888671875, 26.7998046875, 28.7109375, 30.6220703125, 32.533203125, 34.4443359375, 36.35546875, 38.2666015625, 40.177734375, 42.0888671875, 44.0]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 13.0, 109.0, 420.0, 402.0, 61.0, 7.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-218.65985107421875, -206.4739227294922, -194.28799438476562, -182.10208129882812, -169.91615295410156, -157.730224609375, -145.5443115234375, -133.35838317871094, -121.17245483398438, -108.98652648925781, -96.80060577392578, -84.61468505859375, -72.42875671386719, -60.24283218383789, -48.056907653808594, -35.87098693847656, -23.68505859375, -11.499134063720703, 0.6867904663085938, 12.87271499633789, 25.058639526367188, 37.244564056396484, 49.43048858642578, 61.61640930175781, 73.80233764648438, 85.98826599121094, 98.17418670654297, 110.360107421875, 122.54603576660156, 134.73196411132812, 146.91787719726562, 159.1038055419922, 171.28973388671875, 183.4756622314453, 195.66159057617188, 207.84750366210938, 220.03343200683594, 232.2193603515625, 244.4052734375, 256.5911865234375, 268.7771301269531, 280.9630432128906, 293.14898681640625, 305.33489990234375, 317.52081298828125, 329.7067565917969, 341.8926696777344, 354.07861328125, 366.2645263671875, 378.450439453125, 390.6363830566406, 402.8222961425781, 415.00823974609375, 427.19415283203125, 439.38006591796875, 451.56597900390625, 463.7519226074219, 475.9378356933594, 488.123779296875, 500.3096923828125, 512.49560546875, 524.6815185546875, 536.8674926757812, 549.0534057617188, 561.2393188476562]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 4.0, 5.0, 6.0, 7.0, 7.0, 12.0, 16.0, 8.0, 23.0, 20.0, 26.0, 15.0, 32.0, 29.0, 40.0, 35.0, 43.0, 44.0, 35.0, 38.0, 39.0, 46.0, 44.0, 42.0, 46.0, 46.0, 37.0, 32.0, 34.0, 33.0, 23.0, 23.0, 16.0, 8.0, 13.0, 15.0, 9.0, 14.0, 10.0, 7.0, 3.0, 5.0, 5.0, 3.0, 1.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-80.37522888183594, -77.98039245605469, -75.58555603027344, -73.19071960449219, -70.79588317871094, -68.40104675292969, -66.00621032714844, -63.61137008666992, -61.21653366088867, -58.82169723510742, -56.42686080932617, -54.03202438354492, -51.637184143066406, -49.242347717285156, -46.847511291503906, -44.452674865722656, -42.057838439941406, -39.663002014160156, -37.268165588378906, -34.873329162597656, -32.478492736816406, -30.083654403686523, -27.68881607055664, -25.29397964477539, -22.89914321899414, -20.50430679321289, -18.10947036743164, -15.714632034301758, -13.319795608520508, -10.924959182739258, -8.530121803283691, -6.135284423828125, -3.740447998046875, -1.3456110954284668, 1.0492258071899414, 3.4440627098083496, 5.838899612426758, 8.233736038208008, 10.628573417663574, 13.02341079711914, 15.41824722290039, 17.81308364868164, 20.20792007446289, 22.602758407592773, 24.997594833374023, 27.392431259155273, 29.787269592285156, 32.182106018066406, 34.576942443847656, 36.971778869628906, 39.366615295410156, 41.761451721191406, 44.156288146972656, 46.551124572753906, 48.94596481323242, 51.34080123901367, 53.73563766479492, 56.13047409057617, 58.52531051635742, 60.92014694213867, 63.31498718261719, 65.70982360839844, 68.10466003417969, 70.49949645996094, 72.89433288574219]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 6.0, 8.0, 4.0, 6.0, 10.0, 18.0, 11.0, 12.0, 13.0, 21.0, 25.0, 13.0, 32.0, 26.0, 37.0, 49.0, 45.0, 42.0, 44.0, 36.0, 50.0, 41.0, 34.0, 53.0, 53.0, 43.0, 51.0, 25.0, 37.0, 22.0, 21.0, 25.0, 23.0, 9.0, 18.0, 13.0, 10.0, 8.0, 5.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.5625, -12.1400146484375, -11.717529296875, -11.2950439453125, -10.87255859375, -10.4500732421875, -10.027587890625, -9.6051025390625, -9.1826171875, -8.7601318359375, -8.337646484375, -7.9151611328125, -7.49267578125, -7.0701904296875, -6.647705078125, -6.2252197265625, -5.802734375, -5.3802490234375, -4.957763671875, -4.5352783203125, -4.11279296875, -3.6903076171875, -3.267822265625, -2.8453369140625, -2.4228515625, -2.0003662109375, -1.577880859375, -1.1553955078125, -0.73291015625, -0.3104248046875, 0.112060546875, 0.5345458984375, 0.95703125, 1.3795166015625, 1.802001953125, 2.2244873046875, 2.64697265625, 3.0694580078125, 3.491943359375, 3.9144287109375, 4.3369140625, 4.7593994140625, 5.181884765625, 5.6043701171875, 6.02685546875, 6.4493408203125, 6.871826171875, 7.2943115234375, 7.716796875, 8.1392822265625, 8.561767578125, 8.9842529296875, 9.40673828125, 9.8292236328125, 10.251708984375, 10.6741943359375, 11.0966796875, 11.5191650390625, 11.941650390625, 12.3641357421875, 12.78662109375, 13.2091064453125, 13.631591796875, 14.0540771484375, 14.4765625]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 5.0, 4.0, 1.0, 11.0, 14.0, 18.0, 28.0, 33.0, 67.0, 93.0, 124.0, 225.0, 296.0, 469.0, 732.0, 1040.0, 1721.0, 2670.0, 4078.0, 6698.0, 10578.0, 17010.0, 26867.0, 44593.0, 73476.0, 124750.0, 223719.0, 211548.0, 117223.0, 69563.0, 41593.0, 25664.0, 16172.0, 10011.0, 6222.0, 3993.0, 2496.0, 1600.0, 1077.0, 708.0, 461.0, 297.0, 221.0, 130.0, 84.0, 51.0, 56.0, 22.0, 17.0, 14.0, 9.0, 6.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2110595703125, -0.2042388916015625, -0.197418212890625, -0.1905975341796875, -0.18377685546875, -0.1769561767578125, -0.170135498046875, -0.1633148193359375, -0.156494140625, -0.1496734619140625, -0.142852783203125, -0.1360321044921875, -0.12921142578125, -0.1223907470703125, -0.115570068359375, -0.1087493896484375, -0.1019287109375, -0.0951080322265625, -0.088287353515625, -0.0814666748046875, -0.07464599609375, -0.0678253173828125, -0.061004638671875, -0.0541839599609375, -0.04736328125, -0.0405426025390625, -0.033721923828125, -0.0269012451171875, -0.02008056640625, -0.0132598876953125, -0.006439208984375, 0.0003814697265625, 0.0072021484375, 0.0140228271484375, 0.020843505859375, 0.0276641845703125, 0.03448486328125, 0.0413055419921875, 0.048126220703125, 0.0549468994140625, 0.061767578125, 0.0685882568359375, 0.075408935546875, 0.0822296142578125, 0.08905029296875, 0.0958709716796875, 0.102691650390625, 0.1095123291015625, 0.1163330078125, 0.1231536865234375, 0.129974365234375, 0.1367950439453125, 0.14361572265625, 0.1504364013671875, 0.157257080078125, 0.1640777587890625, 0.1708984375, 0.1777191162109375, 0.184539794921875, 0.1913604736328125, 0.19818115234375, 0.2050018310546875, 0.211822509765625, 0.2186431884765625, 0.2254638671875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 3.0, 6.0, 9.0, 17.0, 15.0, 14.0, 22.0, 27.0, 23.0, 23.0, 31.0, 34.0, 35.0, 38.0, 43.0, 52.0, 41.0, 47.0, 1072.0, 44.0, 39.0, 42.0, 36.0, 33.0, 35.0, 31.0, 28.0, 27.0, 30.0, 22.0, 10.0, 20.0, 12.0, 21.0, 10.0, 3.0, 9.0, 8.0, 7.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.671875, -8.3912353515625, -8.110595703125, -7.8299560546875, -7.54931640625, -7.2686767578125, -6.988037109375, -6.7073974609375, -6.4267578125, -6.1461181640625, -5.865478515625, -5.5848388671875, -5.30419921875, -5.0235595703125, -4.742919921875, -4.4622802734375, -4.181640625, -3.9010009765625, -3.620361328125, -3.3397216796875, -3.05908203125, -2.7784423828125, -2.497802734375, -2.2171630859375, -1.9365234375, -1.6558837890625, -1.375244140625, -1.0946044921875, -0.81396484375, -0.5333251953125, -0.252685546875, 0.0279541015625, 0.30859375, 0.5892333984375, 0.869873046875, 1.1505126953125, 1.43115234375, 1.7117919921875, 1.992431640625, 2.2730712890625, 2.5537109375, 2.8343505859375, 3.114990234375, 3.3956298828125, 3.67626953125, 3.9569091796875, 4.237548828125, 4.5181884765625, 4.798828125, 5.0794677734375, 5.360107421875, 5.6407470703125, 5.92138671875, 6.2020263671875, 6.482666015625, 6.7633056640625, 7.0439453125, 7.3245849609375, 7.605224609375, 7.8858642578125, 8.16650390625, 8.4471435546875, 8.727783203125, 9.0084228515625, 9.2890625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 4.0, 8.0, 6.0, 7.0, 14.0, 25.0, 40.0, 46.0, 75.0, 107.0, 155.0, 228.0, 364.0, 508.0, 776.0, 1308.0, 1840.0, 2731.0, 4153.0, 6305.0, 9780.0, 15446.0, 24691.0, 40232.0, 65637.0, 112469.0, 201314.0, 1277942.0, 131531.0, 75656.0, 45967.0, 28421.0, 17429.0, 11158.0, 7146.0, 4595.0, 3034.0, 2013.0, 1256.0, 851.0, 585.0, 443.0, 310.0, 211.0, 97.0, 68.0, 48.0, 35.0, 25.0, 21.0, 14.0, 8.0, 3.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.13818359375, -0.1337451934814453, -0.12930679321289062, -0.12486839294433594, -0.12042999267578125, -0.11599159240722656, -0.11155319213867188, -0.10711479187011719, -0.1026763916015625, -0.09823799133300781, -0.09379959106445312, -0.08936119079589844, -0.08492279052734375, -0.08048439025878906, -0.07604598999023438, -0.07160758972167969, -0.067169189453125, -0.06273078918457031, -0.058292388916015625, -0.05385398864746094, -0.04941558837890625, -0.04497718811035156, -0.040538787841796875, -0.03610038757324219, -0.0316619873046875, -0.027223587036132812, -0.022785186767578125, -0.018346786499023438, -0.01390838623046875, -0.009469985961914062, -0.005031585693359375, -0.0005931854248046875, 0.00384521484375, 0.008283615112304688, 0.012722015380859375, 0.017160415649414062, 0.02159881591796875, 0.026037216186523438, 0.030475616455078125, 0.03491401672363281, 0.0393524169921875, 0.04379081726074219, 0.048229217529296875, 0.05266761779785156, 0.05710601806640625, 0.06154441833496094, 0.06598281860351562, 0.07042121887207031, 0.074859619140625, 0.07929801940917969, 0.08373641967773438, 0.08817481994628906, 0.09261322021484375, 0.09705162048339844, 0.10149002075195312, 0.10592842102050781, 0.1103668212890625, 0.11480522155761719, 0.11924362182617188, 0.12368202209472656, 0.12812042236328125, 0.13255882263183594, 0.13699722290039062, 0.1414356231689453, 0.1458740234375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 5.0, 9.0, 6.0, 5.0, 12.0, 5.0, 17.0, 16.0, 19.0, 24.0, 31.0, 33.0, 49.0, 42.0, 66.0, 62.0, 70.0, 86.0, 63.0, 46.0, 55.0, 39.0, 50.0, 41.0, 21.0, 22.0, 24.0, 27.0, 13.0, 4.0, 4.0, 9.0, 6.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0001347064971923828, -0.0001301206648349762, -0.00012553483247756958, -0.00012094900012016296, -0.00011636316776275635, -0.00011177733540534973, -0.00010719150304794312, -0.0001026056706905365, -9.801983833312988e-05, -9.343400597572327e-05, -8.884817361831665e-05, -8.426234126091003e-05, -7.967650890350342e-05, -7.50906765460968e-05, -7.050484418869019e-05, -6.591901183128357e-05, -6.133317947387695e-05, -5.674734711647034e-05, -5.216151475906372e-05, -4.7575682401657104e-05, -4.298985004425049e-05, -3.840401768684387e-05, -3.3818185329437256e-05, -2.923235297203064e-05, -2.4646520614624023e-05, -2.0060688257217407e-05, -1.547485589981079e-05, -1.0889023542404175e-05, -6.303191184997559e-06, -1.7173588275909424e-06, 2.868473529815674e-06, 7.45430588722229e-06, 1.2040138244628906e-05, 1.6625970602035522e-05, 2.121180295944214e-05, 2.5797635316848755e-05, 3.038346767425537e-05, 3.496930003166199e-05, 3.9555132389068604e-05, 4.414096474647522e-05, 4.8726797103881836e-05, 5.331262946128845e-05, 5.789846181869507e-05, 6.248429417610168e-05, 6.70701265335083e-05, 7.165595889091492e-05, 7.624179124832153e-05, 8.082762360572815e-05, 8.541345596313477e-05, 8.999928832054138e-05, 9.4585120677948e-05, 9.917095303535461e-05, 0.00010375678539276123, 0.00010834261775016785, 0.00011292845010757446, 0.00011751428246498108, 0.0001221001148223877, 0.0001266859471797943, 0.00013127177953720093, 0.00013585761189460754, 0.00014044344425201416, 0.00014502927660942078, 0.0001496151089668274, 0.000154200941324234, 0.00015878677368164062]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 4.0, 6.0, 3.0, 6.0, 7.0, 11.0, 6.0, 12.0, 21.0, 39.0, 27.0, 40.0, 72.0, 104.0, 139.0, 233.0, 446.0, 1320.0, 152831.0, 889387.0, 2443.0, 537.0, 282.0, 170.0, 113.0, 76.0, 43.0, 39.0, 32.0, 24.0, 13.0, 12.0, 10.0, 10.0, 8.0, 10.0, 5.0, 3.0, 2.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0034618377685546875, -0.003360360860824585, -0.0032588839530944824, -0.00315740704536438, -0.0030559301376342773, -0.002954453229904175, -0.0028529763221740723, -0.0027514994144439697, -0.002650022506713867, -0.0025485455989837646, -0.002447068691253662, -0.0023455917835235596, -0.002244114875793457, -0.0021426379680633545, -0.002041161060333252, -0.0019396841526031494, -0.0018382072448730469, -0.0017367303371429443, -0.0016352534294128418, -0.0015337765216827393, -0.0014322996139526367, -0.0013308227062225342, -0.0012293457984924316, -0.001127868890762329, -0.0010263919830322266, -0.000924915075302124, -0.0008234381675720215, -0.0007219612598419189, -0.0006204843521118164, -0.0005190074443817139, -0.00041753053665161133, -0.0003160536289215088, -0.00021457672119140625, -0.00011309981346130371, -1.1622905731201172e-05, 8.985400199890137e-05, 0.0001913309097290039, 0.00029280781745910645, 0.000394284725189209, 0.0004957616329193115, 0.0005972385406494141, 0.0006987154483795166, 0.0008001923561096191, 0.0009016692638397217, 0.0010031461715698242, 0.0011046230792999268, 0.0012060999870300293, 0.0013075768947601318, 0.0014090538024902344, 0.001510530710220337, 0.0016120076179504395, 0.001713484525680542, 0.0018149614334106445, 0.001916438341140747, 0.0020179152488708496, 0.002119392156600952, 0.0022208690643310547, 0.0023223459720611572, 0.0024238228797912598, 0.0025252997875213623, 0.002626776695251465, 0.0027282536029815674, 0.00282973051071167, 0.0029312074184417725, 0.003032684326171875]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 106.0, 909.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00045334320748224854, -0.0003064321062993258, -0.0001595210051164031, -1.2609903933480382e-05, 0.00013430119724944234, 0.0002812123275361955, 0.0004281233996152878, 0.00057503447169438, 0.0007219456019811332, 0.0008688566740602255, 0.0010157678043469787, 0.0011626789346337318, 0.0013095899485051632, 0.0014565011952072382, 0.0016034122090786695, 0.001750323222950101, 0.001897234469652176, 0.0020441454835236073, 0.0021910567302256823, 0.0023379677440971136, 0.0024848789907991886, 0.00263179000467062, 0.0027787010185420513, 0.0029256120324134827, 0.0030725232791155577, 0.003219434292986989, 0.003366345539689064, 0.0035132565535604954, 0.0036601675674319267, 0.0038070788141340017, 0.003953990060836077, 0.004100901074707508, 0.004247811622917652, 0.0043947226367890835, 0.004541633650660515, 0.0046885451301932335, 0.004835456144064665, 0.004982367157936096, 0.0051292781718075275, 0.005276189185678959, 0.0054231006652116776, 0.005570011679083109, 0.00571692269295454, 0.005863834172487259, 0.00601074518635869, 0.006157656200230122, 0.006304567214101553, 0.006451478227972984, 0.006598389241844416, 0.006745300255715847, 0.006892211269587278, 0.007039122749119997, 0.007186033762991428, 0.00733294477686286, 0.007479855790734291, 0.007626766804605722, 0.007773677818477154, 0.007920589298009872, 0.008067499846220016, 0.008214411325752735, 0.00836132187396288, 0.008508233353495598, 0.008655144833028316, 0.00880205538123846, 0.00894896686077118]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 17.0, 21.0, 56.0, 89.0, 147.0, 174.0, 178.0, 133.0, 100.0, 51.0, 24.0, 17.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00040650367736816406, -0.0003951890394091606, -0.00038387440145015717, -0.0003725597634911537, -0.00036124512553215027, -0.0003499304875731468, -0.00033861584961414337, -0.0003273012116551399, -0.0003159865736961365, -0.000304671935737133, -0.0002933572977781296, -0.00028204265981912613, -0.0002707280218601227, -0.00025941338390111923, -0.0002480987459421158, -0.00023678410798311234, -0.0002254694700241089, -0.00021415483206510544, -0.000202840194106102, -0.00019152555614709854, -0.0001802109181880951, -0.00016889628022909164, -0.0001575816422700882, -0.00014626700431108475, -0.0001349523663520813, -0.00012363772839307785, -0.0001123230904340744, -0.00010100845247507095, -8.96938145160675e-05, -7.837917655706406e-05, -6.706453859806061e-05, -5.574990063905716e-05, -4.443526268005371e-05, -3.312062472105026e-05, -2.1805986762046814e-05, -1.0491348803043365e-05, 8.23289155960083e-07, 1.2137927114963531e-05, 2.345256507396698e-05, 3.476720303297043e-05, 4.608184099197388e-05, 5.7396478950977325e-05, 6.871111690998077e-05, 8.002575486898422e-05, 9.134039282798767e-05, 0.00010265503078699112, 0.00011396966874599457, 0.00012528430670499802, 0.00013659894466400146, 0.0001479135826230049, 0.00015922822058200836, 0.0001705428585410118, 0.00018185749650001526, 0.0001931721344590187, 0.00020448677241802216, 0.0002158014103770256, 0.00022711604833602905, 0.0002384306862950325, 0.00024974532425403595, 0.0002610599622130394, 0.00027237460017204285, 0.0002836892381310463, 0.00029500387609004974, 0.0003063185140490532, 0.00031763315200805664]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 6.0, 8.0, 4.0, 6.0, 10.0, 18.0, 11.0, 12.0, 13.0, 21.0, 25.0, 13.0, 32.0, 26.0, 37.0, 49.0, 45.0, 42.0, 44.0, 36.0, 50.0, 41.0, 34.0, 53.0, 53.0, 43.0, 51.0, 25.0, 37.0, 22.0, 21.0, 25.0, 23.0, 9.0, 18.0, 13.0, 10.0, 8.0, 5.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.5625, -12.1400146484375, -11.717529296875, -11.2950439453125, -10.87255859375, -10.4500732421875, -10.027587890625, -9.6051025390625, -9.1826171875, -8.7601318359375, -8.337646484375, -7.9151611328125, -7.49267578125, -7.0701904296875, -6.647705078125, -6.2252197265625, -5.802734375, -5.3802490234375, -4.957763671875, -4.5352783203125, -4.11279296875, -3.6903076171875, -3.267822265625, -2.8453369140625, -2.4228515625, -2.0003662109375, -1.577880859375, -1.1553955078125, -0.73291015625, -0.3104248046875, 0.112060546875, 0.5345458984375, 0.95703125, 1.3795166015625, 1.802001953125, 2.2244873046875, 2.64697265625, 3.0694580078125, 3.491943359375, 3.9144287109375, 4.3369140625, 4.7593994140625, 5.181884765625, 5.6043701171875, 6.02685546875, 6.4493408203125, 6.871826171875, 7.2943115234375, 7.716796875, 8.1392822265625, 8.561767578125, 8.9842529296875, 9.40673828125, 9.8292236328125, 10.251708984375, 10.6741943359375, 11.0966796875, 11.5191650390625, 11.941650390625, 12.3641357421875, 12.78662109375, 13.2091064453125, 13.631591796875, 14.0540771484375, 14.4765625]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 16.0, 13.0, 12.0, 29.0, 30.0, 42.0, 55.0, 84.0, 132.0, 187.0, 338.0, 606.0, 1086.0, 2269.0, 5365.0, 16682.0, 92460.0, 696774.0, 192545.0, 26369.0, 7386.0, 2857.0, 1376.0, 731.0, 425.0, 228.0, 137.0, 97.0, 64.0, 46.0, 33.0, 18.0, 22.0, 11.0, 9.0, 7.0, 3.0, 6.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.265625, -21.539306640625, -20.81298828125, -20.086669921875, -19.3603515625, -18.634033203125, -17.90771484375, -17.181396484375, -16.455078125, -15.728759765625, -15.00244140625, -14.276123046875, -13.5498046875, -12.823486328125, -12.09716796875, -11.370849609375, -10.64453125, -9.918212890625, -9.19189453125, -8.465576171875, -7.7392578125, -7.012939453125, -6.28662109375, -5.560302734375, -4.833984375, -4.107666015625, -3.38134765625, -2.655029296875, -1.9287109375, -1.202392578125, -0.47607421875, 0.250244140625, 0.9765625, 1.702880859375, 2.42919921875, 3.155517578125, 3.8818359375, 4.608154296875, 5.33447265625, 6.060791015625, 6.787109375, 7.513427734375, 8.23974609375, 8.966064453125, 9.6923828125, 10.418701171875, 11.14501953125, 11.871337890625, 12.59765625, 13.323974609375, 14.05029296875, 14.776611328125, 15.5029296875, 16.229248046875, 16.95556640625, 17.681884765625, 18.408203125, 19.134521484375, 19.86083984375, 20.587158203125, 21.3134765625, 22.039794921875, 22.76611328125, 23.492431640625, 24.21875]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 7.0, 1.0, 9.0, 14.0, 12.0, 15.0, 26.0, 19.0, 30.0, 18.0, 30.0, 42.0, 51.0, 75.0, 88.0, 185.0, 1560.0, 322.0, 120.0, 81.0, 53.0, 51.0, 43.0, 28.0, 29.0, 18.0, 23.0, 17.0, 17.0, 14.0, 20.0, 6.0, 5.0, 4.0, 7.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.125, -29.146484375, -28.16796875, -27.189453125, -26.2109375, -25.232421875, -24.25390625, -23.275390625, -22.296875, -21.318359375, -20.33984375, -19.361328125, -18.3828125, -17.404296875, -16.42578125, -15.447265625, -14.46875, -13.490234375, -12.51171875, -11.533203125, -10.5546875, -9.576171875, -8.59765625, -7.619140625, -6.640625, -5.662109375, -4.68359375, -3.705078125, -2.7265625, -1.748046875, -0.76953125, 0.208984375, 1.1875, 2.166015625, 3.14453125, 4.123046875, 5.1015625, 6.080078125, 7.05859375, 8.037109375, 9.015625, 9.994140625, 10.97265625, 11.951171875, 12.9296875, 13.908203125, 14.88671875, 15.865234375, 16.84375, 17.822265625, 18.80078125, 19.779296875, 20.7578125, 21.736328125, 22.71484375, 23.693359375, 24.671875, 25.650390625, 26.62890625, 27.607421875, 28.5859375, 29.564453125, 30.54296875, 31.521484375, 32.5]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 5.0, 7.0, 10.0, 7.0, 21.0, 18.0, 25.0, 25.0, 27.0, 46.0, 75.0, 134.0, 245.0, 470.0, 1249.0, 62772.0, 3076171.0, 2940.0, 695.0, 309.0, 157.0, 81.0, 56.0, 39.0, 31.0, 28.0, 19.0, 12.0, 6.0, 5.0, 7.0, 5.0, 4.0, 0.0, 3.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.9375, -83.3505859375, -80.763671875, -78.1767578125, -75.58984375, -73.0029296875, -70.416015625, -67.8291015625, -65.2421875, -62.6552734375, -60.068359375, -57.4814453125, -54.89453125, -52.3076171875, -49.720703125, -47.1337890625, -44.546875, -41.9599609375, -39.373046875, -36.7861328125, -34.19921875, -31.6123046875, -29.025390625, -26.4384765625, -23.8515625, -21.2646484375, -18.677734375, -16.0908203125, -13.50390625, -10.9169921875, -8.330078125, -5.7431640625, -3.15625, -0.5693359375, 2.017578125, 4.6044921875, 7.19140625, 9.7783203125, 12.365234375, 14.9521484375, 17.5390625, 20.1259765625, 22.712890625, 25.2998046875, 27.88671875, 30.4736328125, 33.060546875, 35.6474609375, 38.234375, 40.8212890625, 43.408203125, 45.9951171875, 48.58203125, 51.1689453125, 53.755859375, 56.3427734375, 58.9296875, 61.5166015625, 64.103515625, 66.6904296875, 69.27734375, 71.8642578125, 74.451171875, 77.0380859375, 79.625]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 9.0, 198.0, 711.0, 88.0, 7.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.34883117675781, -27.304141998291016, -19.259450912475586, -11.214759826660156, -3.1700706481933594, 4.8746185302734375, 12.9193115234375, 20.964000701904297, 29.008689880371094, 37.05337905883789, 45.09806823730469, 53.14276123046875, 61.18745040893555, 69.23213958740234, 77.2768325805664, 85.32151794433594, 93.3662109375, 101.41090393066406, 109.4555892944336, 117.50028228759766, 125.54496765136719, 133.58966064453125, 141.6343536376953, 149.67904663085938, 157.72372436523438, 165.76841735839844, 173.8131103515625, 181.8577880859375, 189.90248107910156, 197.94717407226562, 205.9918670654297, 214.03656005859375, 222.08126831054688, 230.12596130371094, 238.170654296875, 246.21533203125, 254.26002502441406, 262.3047180175781, 270.34942626953125, 278.39410400390625, 286.43878173828125, 294.48345947265625, 302.5281677246094, 310.5728454589844, 318.6175537109375, 326.6622314453125, 334.7069091796875, 342.7516174316406, 350.79632568359375, 358.84100341796875, 366.8857116699219, 374.9303894042969, 382.97509765625, 391.019775390625, 399.064453125, 407.1091613769531, 415.1538391113281, 423.1985168457031, 431.24322509765625, 439.28790283203125, 447.3326110839844, 455.3772888183594, 463.4219970703125, 471.4666748046875, 479.5113525390625]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 3.0, 5.0, 7.0, 11.0, 14.0, 11.0, 19.0, 26.0, 19.0, 28.0, 27.0, 31.0, 30.0, 37.0, 44.0, 34.0, 44.0, 45.0, 48.0, 46.0, 42.0, 39.0, 37.0, 38.0, 46.0, 23.0, 42.0, 42.0, 25.0, 26.0, 22.0, 24.0, 12.0, 17.0, 9.0, 7.0, 4.0, 5.0, 2.0, 7.0, 1.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-81.09115600585938, -78.91677856445312, -76.74239349365234, -74.5680160522461, -72.39363098144531, -70.21925354003906, -68.04486846923828, -65.87049102783203, -63.69610595703125, -61.521724700927734, -59.34734344482422, -57.1729621887207, -54.99858093261719, -52.82419967651367, -50.649818420410156, -48.475440979003906, -46.30105972290039, -44.126678466796875, -41.95229721069336, -39.777915954589844, -37.60353469848633, -35.42915344238281, -33.25477600097656, -31.080392837524414, -28.9060115814209, -26.731630325317383, -24.557249069213867, -22.382869720458984, -20.20848846435547, -18.034107208251953, -15.859725952148438, -13.685344696044922, -11.510963439941406, -9.33658218383789, -7.162201404571533, -4.987820625305176, -2.81343936920166, -0.6390581130981445, 1.5353221893310547, 3.7097034454345703, 5.884084701538086, 8.058465957641602, 10.232847213745117, 12.407227516174316, 14.581608772277832, 16.75598907470703, 18.930370330810547, 21.104751586914062, 23.279132843017578, 25.453514099121094, 27.62789535522461, 29.802276611328125, 31.97665786743164, 34.151039123535156, 36.325416564941406, 38.49980163574219, 40.67417907714844, 42.84856033325195, 45.02294158935547, 47.197322845458984, 49.3717041015625, 51.546085357666016, 53.72046661376953, 55.89484405517578, 58.06922912597656]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 4.0, 5.0, 5.0, 6.0, 12.0, 14.0, 18.0, 11.0, 23.0, 19.0, 14.0, 26.0, 29.0, 40.0, 41.0, 38.0, 57.0, 36.0, 49.0, 45.0, 42.0, 40.0, 47.0, 54.0, 40.0, 43.0, 40.0, 30.0, 33.0, 24.0, 19.0, 24.0, 15.0, 12.0, 13.0, 14.0, 10.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.34375, -13.8814697265625, -13.419189453125, -12.9569091796875, -12.49462890625, -12.0323486328125, -11.570068359375, -11.1077880859375, -10.6455078125, -10.1832275390625, -9.720947265625, -9.2586669921875, -8.79638671875, -8.3341064453125, -7.871826171875, -7.4095458984375, -6.947265625, -6.4849853515625, -6.022705078125, -5.5604248046875, -5.09814453125, -4.6358642578125, -4.173583984375, -3.7113037109375, -3.2490234375, -2.7867431640625, -2.324462890625, -1.8621826171875, -1.39990234375, -0.9376220703125, -0.475341796875, -0.0130615234375, 0.44921875, 0.9114990234375, 1.373779296875, 1.8360595703125, 2.29833984375, 2.7606201171875, 3.222900390625, 3.6851806640625, 4.1474609375, 4.6097412109375, 5.072021484375, 5.5343017578125, 5.99658203125, 6.4588623046875, 6.921142578125, 7.3834228515625, 7.845703125, 8.3079833984375, 8.770263671875, 9.2325439453125, 9.69482421875, 10.1571044921875, 10.619384765625, 11.0816650390625, 11.5439453125, 12.0062255859375, 12.468505859375, 12.9307861328125, 13.39306640625, 13.8553466796875, 14.317626953125, 14.7799072265625, 15.2421875]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 7.0, 1.0, 5.0, 5.0, 6.0, 10.0, 24.0, 24.0, 38.0, 38.0, 46.0, 83.0, 120.0, 143.0, 190.0, 312.0, 422.0, 744.0, 1362.0, 2850.0, 7877.0, 32414.0, 1099880.0, 2970339.0, 57973.0, 11410.0, 3876.0, 1641.0, 837.0, 510.0, 334.0, 226.0, 146.0, 108.0, 89.0, 61.0, 41.0, 34.0, 25.0, 17.0, 12.0, 5.0, 5.0, 5.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.6875, -64.4755859375, -62.263671875, -60.0517578125, -57.83984375, -55.6279296875, -53.416015625, -51.2041015625, -48.9921875, -46.7802734375, -44.568359375, -42.3564453125, -40.14453125, -37.9326171875, -35.720703125, -33.5087890625, -31.296875, -29.0849609375, -26.873046875, -24.6611328125, -22.44921875, -20.2373046875, -18.025390625, -15.8134765625, -13.6015625, -11.3896484375, -9.177734375, -6.9658203125, -4.75390625, -2.5419921875, -0.330078125, 1.8818359375, 4.09375, 6.3056640625, 8.517578125, 10.7294921875, 12.94140625, 15.1533203125, 17.365234375, 19.5771484375, 21.7890625, 24.0009765625, 26.212890625, 28.4248046875, 30.63671875, 32.8486328125, 35.060546875, 37.2724609375, 39.484375, 41.6962890625, 43.908203125, 46.1201171875, 48.33203125, 50.5439453125, 52.755859375, 54.9677734375, 57.1796875, 59.3916015625, 61.603515625, 63.8154296875, 66.02734375, 68.2392578125, 70.451171875, 72.6630859375, 74.875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 5.0, 5.0, 12.0, 7.0, 17.0, 25.0, 28.0, 37.0, 44.0, 55.0, 86.0, 111.0, 190.0, 236.0, 433.0, 630.0, 655.0, 510.0, 327.0, 183.0, 148.0, 90.0, 63.0, 40.0, 38.0, 26.0, 23.0, 21.0, 7.0, 5.0, 7.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-33.53125, -32.65478515625, -31.7783203125, -30.90185546875, -30.025390625, -29.14892578125, -28.2724609375, -27.39599609375, -26.51953125, -25.64306640625, -24.7666015625, -23.89013671875, -23.013671875, -22.13720703125, -21.2607421875, -20.38427734375, -19.5078125, -18.63134765625, -17.7548828125, -16.87841796875, -16.001953125, -15.12548828125, -14.2490234375, -13.37255859375, -12.49609375, -11.61962890625, -10.7431640625, -9.86669921875, -8.990234375, -8.11376953125, -7.2373046875, -6.36083984375, -5.484375, -4.60791015625, -3.7314453125, -2.85498046875, -1.978515625, -1.10205078125, -0.2255859375, 0.65087890625, 1.52734375, 2.40380859375, 3.2802734375, 4.15673828125, 5.033203125, 5.90966796875, 6.7861328125, 7.66259765625, 8.5390625, 9.41552734375, 10.2919921875, 11.16845703125, 12.044921875, 12.92138671875, 13.7978515625, 14.67431640625, 15.55078125, 16.42724609375, 17.3037109375, 18.18017578125, 19.056640625, 19.93310546875, 20.8095703125, 21.68603515625, 22.5625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 9.0, 19.0, 37.0, 62.0, 152.0, 331.0, 969.0, 2963.0, 9701.0, 38964.0, 253093.0, 3273127.0, 534690.0, 60286.0, 13874.0, 3844.0, 1303.0, 455.0, 200.0, 100.0, 47.0, 25.0, 17.0, 6.0, 0.0, 1.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.6875, -32.4228515625, -31.158203125, -29.8935546875, -28.62890625, -27.3642578125, -26.099609375, -24.8349609375, -23.5703125, -22.3056640625, -21.041015625, -19.7763671875, -18.51171875, -17.2470703125, -15.982421875, -14.7177734375, -13.453125, -12.1884765625, -10.923828125, -9.6591796875, -8.39453125, -7.1298828125, -5.865234375, -4.6005859375, -3.3359375, -2.0712890625, -0.806640625, 0.4580078125, 1.72265625, 2.9873046875, 4.251953125, 5.5166015625, 6.78125, 8.0458984375, 9.310546875, 10.5751953125, 11.83984375, 13.1044921875, 14.369140625, 15.6337890625, 16.8984375, 18.1630859375, 19.427734375, 20.6923828125, 21.95703125, 23.2216796875, 24.486328125, 25.7509765625, 27.015625, 28.2802734375, 29.544921875, 30.8095703125, 32.07421875, 33.3388671875, 34.603515625, 35.8681640625, 37.1328125, 38.3974609375, 39.662109375, 40.9267578125, 42.19140625, 43.4560546875, 44.720703125, 45.9853515625, 47.25]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 0.0, 5.0, 3.0, 6.0, 1.0, 5.0, 6.0, 16.0, 7.0, 9.0, 17.0, 16.0, 35.0, 39.0, 35.0, 39.0, 55.0, 53.0, 57.0, 75.0, 70.0, 68.0, 66.0, 62.0, 47.0, 38.0, 37.0, 28.0, 24.0, 22.0, 14.0, 13.0, 13.0, 12.0, 3.0, 6.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.01224517822266, -100.30632781982422, -96.60041809082031, -92.89450073242188, -89.18858337402344, -85.482666015625, -81.7767562866211, -78.07083892822266, -74.36492919921875, -70.65901184082031, -66.9531021118164, -63.24718475341797, -59.54126739501953, -55.83535385131836, -52.12944030761719, -48.42352294921875, -44.71760559082031, -41.01169204711914, -37.3057746887207, -33.59986114501953, -29.893945693969727, -26.188030242919922, -22.48211669921875, -18.776201248168945, -15.07028579711914, -11.364370346069336, -7.658455848693848, -3.9525413513183594, -0.2466259002685547, 3.45928955078125, 7.165203094482422, 10.871118545532227, 14.577041625976562, 18.282957077026367, 21.988872528076172, 25.694786071777344, 29.40070152282715, 33.10661697387695, 36.812530517578125, 40.51844787597656, 44.224361419677734, 47.930274963378906, 51.636192321777344, 55.342105865478516, 59.04801940917969, 62.753936767578125, 66.45985412597656, 70.16576385498047, 73.8716812133789, 77.57759857177734, 81.28350830078125, 84.98942565917969, 88.69534301757812, 92.40126037597656, 96.10717010498047, 99.8130874633789, 103.51899719238281, 107.22491455078125, 110.93082427978516, 114.6367416381836, 118.34265899658203, 122.04856872558594, 125.75448608398438, 129.4604034423828, 133.16632080078125]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 3.0, 5.0, 4.0, 6.0, 5.0, 7.0, 5.0, 8.0, 12.0, 15.0, 17.0, 13.0, 23.0, 21.0, 22.0, 41.0, 25.0, 42.0, 32.0, 37.0, 35.0, 32.0, 27.0, 46.0, 44.0, 32.0, 28.0, 36.0, 48.0, 27.0, 37.0, 27.0, 30.0, 42.0, 26.0, 27.0, 21.0, 20.0, 17.0, 8.0, 6.0, 5.0, 9.0, 10.0, 5.0, 8.0, 7.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0], "bins": [-107.6094970703125, -104.57537841796875, -101.541259765625, -98.50714111328125, -95.47303009033203, -92.43891143798828, -89.40479278564453, -86.37067413330078, -83.33656311035156, -80.30244445800781, -77.26832580566406, -74.23420715332031, -71.2000961303711, -68.16597747802734, -65.1318588256836, -62.097740173339844, -59.063621520996094, -56.029502868652344, -52.99538803100586, -49.96126937866211, -46.927154541015625, -43.893035888671875, -40.858917236328125, -37.824798583984375, -34.79068374633789, -31.756567001342773, -28.722450256347656, -25.688331604003906, -22.65421485900879, -19.620098114013672, -16.585979461669922, -13.551862716674805, -10.517738342285156, -7.483621120452881, -4.4495038986206055, -1.4153861999511719, 1.6187305450439453, 4.6528472900390625, 7.6869659423828125, 10.72108268737793, 13.755199432373047, 16.789316177368164, 19.82343292236328, 22.85755157470703, 25.89166831970215, 28.925785064697266, 31.959903717041016, 34.9940185546875, 38.02813720703125, 41.062255859375, 44.096370697021484, 47.130489349365234, 50.16460418701172, 53.19872283935547, 56.23284149169922, 59.26696014404297, 62.30107498168945, 65.33518981933594, 68.36930847167969, 71.40342712402344, 74.43754577636719, 77.47166442871094, 80.50578308105469, 83.5398941040039, 86.57401275634766]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 4.0, 6.0, 4.0, 4.0, 7.0, 4.0, 17.0, 17.0, 11.0, 10.0, 21.0, 22.0, 22.0, 30.0, 30.0, 34.0, 36.0, 40.0, 33.0, 35.0, 38.0, 43.0, 41.0, 36.0, 27.0, 40.0, 47.0, 34.0, 29.0, 37.0, 34.0, 32.0, 32.0, 27.0, 22.0, 17.0, 9.0, 11.0, 13.0, 6.0, 10.0, 9.0, 6.0, 8.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-175.5, -169.81640625, -164.1328125, -158.44921875, -152.765625, -147.08203125, -141.3984375, -135.71484375, -130.03125, -124.34765625, -118.6640625, -112.98046875, -107.296875, -101.61328125, -95.9296875, -90.24609375, -84.5625, -78.87890625, -73.1953125, -67.51171875, -61.828125, -56.14453125, -50.4609375, -44.77734375, -39.09375, -33.41015625, -27.7265625, -22.04296875, -16.359375, -10.67578125, -4.9921875, 0.69140625, 6.375, 12.05859375, 17.7421875, 23.42578125, 29.109375, 34.79296875, 40.4765625, 46.16015625, 51.84375, 57.52734375, 63.2109375, 68.89453125, 74.578125, 80.26171875, 85.9453125, 91.62890625, 97.3125, 102.99609375, 108.6796875, 114.36328125, 120.046875, 125.73046875, 131.4140625, 137.09765625, 142.78125, 148.46484375, 154.1484375, 159.83203125, 165.515625, 171.19921875, 176.8828125, 182.56640625, 188.25]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 6.0, 10.0, 17.0, 18.0, 25.0, 31.0, 61.0, 101.0, 113.0, 156.0, 229.0, 361.0, 498.0, 717.0, 1035.0, 1420.0, 2037.0, 3037.0, 4314.0, 6322.0, 9506.0, 14239.0, 22002.0, 34786.0, 55485.0, 90977.0, 154749.0, 234883.0, 158348.0, 93587.0, 56694.0, 34991.0, 22459.0, 14764.0, 9735.0, 6562.0, 4386.0, 2934.0, 2110.0, 1494.0, 1014.0, 718.0, 523.0, 340.0, 232.0, 155.0, 120.0, 86.0, 55.0, 34.0, 30.0, 21.0, 15.0, 12.0, 7.0, 5.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.03125, -2.935089111328125, -2.83892822265625, -2.742767333984375, -2.6466064453125, -2.550445556640625, -2.45428466796875, -2.358123779296875, -2.261962890625, -2.165802001953125, -2.06964111328125, -1.973480224609375, -1.8773193359375, -1.781158447265625, -1.68499755859375, -1.588836669921875, -1.49267578125, -1.396514892578125, -1.30035400390625, -1.204193115234375, -1.1080322265625, -1.011871337890625, -0.91571044921875, -0.819549560546875, -0.723388671875, -0.627227783203125, -0.53106689453125, -0.434906005859375, -0.3387451171875, -0.242584228515625, -0.14642333984375, -0.050262451171875, 0.0458984375, 0.142059326171875, 0.23822021484375, 0.334381103515625, 0.4305419921875, 0.526702880859375, 0.62286376953125, 0.719024658203125, 0.815185546875, 0.911346435546875, 1.00750732421875, 1.103668212890625, 1.1998291015625, 1.295989990234375, 1.39215087890625, 1.488311767578125, 1.58447265625, 1.680633544921875, 1.77679443359375, 1.872955322265625, 1.9691162109375, 2.065277099609375, 2.16143798828125, 2.257598876953125, 2.353759765625, 2.449920654296875, 2.54608154296875, 2.642242431640625, 2.7384033203125, 2.834564208984375, 2.93072509765625, 3.026885986328125, 3.123046875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 5.0, 8.0, 5.0, 8.0, 12.0, 11.0, 15.0, 15.0, 20.0, 19.0, 19.0, 20.0, 26.0, 33.0, 41.0, 27.0, 30.0, 34.0, 20.0, 43.0, 38.0, 40.0, 1066.0, 36.0, 37.0, 37.0, 39.0, 35.0, 31.0, 31.0, 31.0, 21.0, 27.0, 20.0, 17.0, 11.0, 17.0, 6.0, 16.0, 9.0, 6.0, 3.0, 12.0, 7.0, 6.0, 5.0, 6.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.5, -101.90625, -98.3125, -94.71875, -91.125, -87.53125, -83.9375, -80.34375, -76.75, -73.15625, -69.5625, -65.96875, -62.375, -58.78125, -55.1875, -51.59375, -48.0, -44.40625, -40.8125, -37.21875, -33.625, -30.03125, -26.4375, -22.84375, -19.25, -15.65625, -12.0625, -8.46875, -4.875, -1.28125, 2.3125, 5.90625, 9.5, 13.09375, 16.6875, 20.28125, 23.875, 27.46875, 31.0625, 34.65625, 38.25, 41.84375, 45.4375, 49.03125, 52.625, 56.21875, 59.8125, 63.40625, 67.0, 70.59375, 74.1875, 77.78125, 81.375, 84.96875, 88.5625, 92.15625, 95.75, 99.34375, 102.9375, 106.53125, 110.125, 113.71875, 117.3125, 120.90625, 124.5]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 3.0, 10.0, 13.0, 18.0, 33.0, 58.0, 78.0, 105.0, 162.0, 237.0, 317.0, 447.0, 632.0, 927.0, 1233.0, 1803.0, 2566.0, 3621.0, 5185.0, 7602.0, 11328.0, 16940.0, 26139.0, 39986.0, 63882.0, 102945.0, 172299.0, 1261305.0, 139008.0, 84260.0, 53068.0, 33758.0, 21715.0, 14265.0, 9726.0, 6539.0, 4498.0, 3014.0, 2131.0, 1498.0, 1057.0, 808.0, 590.0, 443.0, 299.0, 197.0, 148.0, 80.0, 57.0, 35.0, 28.0, 21.0, 10.0, 5.0, 7.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.859375, -1.799957275390625, -1.74053955078125, -1.681121826171875, -1.6217041015625, -1.562286376953125, -1.50286865234375, -1.443450927734375, -1.384033203125, -1.324615478515625, -1.26519775390625, -1.205780029296875, -1.1463623046875, -1.086944580078125, -1.02752685546875, -0.968109130859375, -0.90869140625, -0.849273681640625, -0.78985595703125, -0.730438232421875, -0.6710205078125, -0.611602783203125, -0.55218505859375, -0.492767333984375, -0.433349609375, -0.373931884765625, -0.31451416015625, -0.255096435546875, -0.1956787109375, -0.136260986328125, -0.07684326171875, -0.017425537109375, 0.0419921875, 0.101409912109375, 0.16082763671875, 0.220245361328125, 0.2796630859375, 0.339080810546875, 0.39849853515625, 0.457916259765625, 0.517333984375, 0.576751708984375, 0.63616943359375, 0.695587158203125, 0.7550048828125, 0.814422607421875, 0.87384033203125, 0.933258056640625, 0.99267578125, 1.052093505859375, 1.11151123046875, 1.170928955078125, 1.2303466796875, 1.289764404296875, 1.34918212890625, 1.408599853515625, 1.468017578125, 1.527435302734375, 1.58685302734375, 1.646270751953125, 1.7056884765625, 1.765106201171875, 1.82452392578125, 1.883941650390625, 1.943359375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 2.0, 4.0, 2.0, 6.0, 6.0, 17.0, 16.0, 17.0, 22.0, 28.0, 41.0, 42.0, 48.0, 101.0, 213.0, 146.0, 55.0, 54.0, 40.0, 21.0, 30.0, 25.0, 12.0, 6.0, 11.0, 7.0, 3.0, 9.0, 3.0, 7.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005252838134765625, -0.005087316036224365, -0.0049217939376831055, -0.004756271839141846, -0.004590749740600586, -0.004425227642059326, -0.004259705543518066, -0.004094183444976807, -0.003928661346435547, -0.003763139247894287, -0.0035976171493530273, -0.0034320950508117676, -0.003266572952270508, -0.003101050853729248, -0.0029355287551879883, -0.0027700066566467285, -0.0026044845581054688, -0.002438962459564209, -0.0022734403610229492, -0.0021079182624816895, -0.0019423961639404297, -0.00177687406539917, -0.0016113519668579102, -0.0014458298683166504, -0.0012803077697753906, -0.0011147856712341309, -0.0009492635726928711, -0.0007837414741516113, -0.0006182193756103516, -0.0004526972770690918, -0.00028717517852783203, -0.00012165307998657227, 4.38690185546875e-05, 0.00020939111709594727, 0.00037491321563720703, 0.0005404353141784668, 0.0007059574127197266, 0.0008714795112609863, 0.001037001609802246, 0.0012025237083435059, 0.0013680458068847656, 0.0015335679054260254, 0.0016990900039672852, 0.001864612102508545, 0.0020301342010498047, 0.0021956562995910645, 0.0023611783981323242, 0.002526700496673584, 0.0026922225952148438, 0.0028577446937561035, 0.0030232667922973633, 0.003188788890838623, 0.003354310989379883, 0.0035198330879211426, 0.0036853551864624023, 0.003850877285003662, 0.004016399383544922, 0.004181921482086182, 0.004347443580627441, 0.004512965679168701, 0.004678487777709961, 0.004844009876251221, 0.0050095319747924805, 0.00517505407333374, 0.005340576171875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 7.0, 2.0, 7.0, 11.0, 8.0, 25.0, 33.0, 58.0, 76.0, 116.0, 221.0, 343.0, 623.0, 1192.0, 2526.0, 5754.0, 15538.0, 50181.0, 214599.0, 602950.0, 107064.0, 29495.0, 9909.0, 3881.0, 1832.0, 902.0, 490.0, 273.0, 167.0, 97.0, 68.0, 43.0, 17.0, 16.0, 13.0, 7.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0269622802734375, -0.026127099990844727, -0.025291919708251953, -0.02445673942565918, -0.023621559143066406, -0.022786378860473633, -0.02195119857788086, -0.021116018295288086, -0.020280838012695312, -0.01944565773010254, -0.018610477447509766, -0.017775297164916992, -0.01694011688232422, -0.016104936599731445, -0.015269756317138672, -0.014434576034545898, -0.013599395751953125, -0.012764215469360352, -0.011929035186767578, -0.011093854904174805, -0.010258674621582031, -0.009423494338989258, -0.008588314056396484, -0.007753133773803711, -0.0069179534912109375, -0.006082773208618164, -0.005247592926025391, -0.004412412643432617, -0.0035772323608398438, -0.0027420520782470703, -0.0019068717956542969, -0.0010716915130615234, -0.00023651123046875, 0.0005986690521240234, 0.0014338493347167969, 0.0022690296173095703, 0.0031042098999023438, 0.003939390182495117, 0.004774570465087891, 0.005609750747680664, 0.0064449310302734375, 0.007280111312866211, 0.008115291595458984, 0.008950471878051758, 0.009785652160644531, 0.010620832443237305, 0.011456012725830078, 0.012291193008422852, 0.013126373291015625, 0.013961553573608398, 0.014796733856201172, 0.015631914138793945, 0.01646709442138672, 0.017302274703979492, 0.018137454986572266, 0.01897263526916504, 0.019807815551757812, 0.020642995834350586, 0.02147817611694336, 0.022313356399536133, 0.023148536682128906, 0.02398371696472168, 0.024818897247314453, 0.025654077529907227, 0.0264892578125]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 10.0, 17.0, 23.0, 37.0, 78.0, 93.0, 191.0, 177.0, 118.0, 68.0, 41.0, 30.0, 28.0, 22.0, 15.0, 11.0, 8.0, 8.0, 4.0, 6.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0074348836205899715, -0.007020418532192707, -0.006605953443795443, -0.006191488355398178, -0.005777023732662201, -0.005362558178603649, -0.004948093555867672, -0.0045336284674704075, -0.004119163379073143, -0.0037046982906758785, -0.003290233202278614, -0.0028757683467119932, -0.0024613032583147287, -0.0020468381699174643, -0.0016323733143508434, -0.001217908225953579, -0.0008034431375563145, -0.0003889781073667109, 2.5486922822892666e-05, 0.0004399518948048353, 0.0008544169832020998, 0.0012688820715993643, 0.001683346927165985, 0.0020978120155632496, 0.002512277103960514, 0.0029267421923577785, 0.003341207280755043, 0.003755672136321664, 0.004170137457549572, 0.004584602080285549, 0.004999067168682814, 0.005413532257080078, 0.005827996879816055, 0.00624246196821332, 0.006656927056610584, 0.007071391679346561, 0.007485857233405113, 0.00790032185614109, 0.008314786478877068, 0.00872925203293562, 0.009143717586994171, 0.009558182209730148, 0.0099726477637887, 0.010387112386524677, 0.010801577940583229, 0.011216042563319206, 0.011630507186055183, 0.012044972740113735, 0.012459437362849712, 0.01287390198558569, 0.013288367539644241, 0.013702832162380219, 0.01411729771643877, 0.014531762339174747, 0.0149462278932333, 0.015360692515969276, 0.015775157138705254, 0.01618962176144123, 0.016604086384177208, 0.017018552869558334, 0.01743301749229431, 0.01784748211503029, 0.018261946737766266, 0.018676411360502243, 0.01909087784588337]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 8.0, 7.0, 6.0, 4.0, 11.0, 11.0, 8.0, 9.0, 17.0, 17.0, 16.0, 16.0, 27.0, 24.0, 22.0, 25.0, 29.0, 28.0, 30.0, 36.0, 31.0, 40.0, 34.0, 35.0, 42.0, 24.0, 33.0, 44.0, 26.0, 24.0, 37.0, 35.0, 31.0, 18.0, 24.0, 20.0, 17.0, 21.0, 19.0, 12.0, 10.0, 11.0, 15.0, 11.0, 10.0, 9.0, 4.0, 5.0, 6.0, 6.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.004262208938598633, -0.004122590646147728, -0.003982972353696823, -0.0038433540612459183, -0.0037037357687950134, -0.0035641174763441086, -0.0034244991838932037, -0.003284880891442299, -0.003145262598991394, -0.003005644306540489, -0.0028660260140895844, -0.0027264077216386795, -0.0025867894291877747, -0.00244717113673687, -0.002307552844285965, -0.00216793455183506, -0.0020283162593841553, -0.0018886979669332504, -0.0017490796744823456, -0.0016094613820314407, -0.0014698430895805359, -0.001330224797129631, -0.0011906065046787262, -0.0010509882122278214, -0.0009113699197769165, -0.0007717516273260117, -0.0006321333348751068, -0.000492515042424202, -0.0003528967499732971, -0.00021327845752239227, -7.366016507148743e-05, 6.595812737941742e-05, 0.00020557641983032227, 0.0003451947122812271, 0.00048481300473213196, 0.0006244312971830368, 0.0007640495896339417, 0.0009036678820848465, 0.0010432861745357513, 0.0011829044669866562, 0.001322522759437561, 0.0014621410518884659, 0.0016017593443393707, 0.0017413776367902756, 0.0018809959292411804, 0.0020206142216920853, 0.00216023251414299, 0.002299850806593895, 0.0024394690990448, 0.0025790873914957047, 0.0027187056839466095, 0.0028583239763975143, 0.002997942268848419, 0.003137560561299324, 0.003277178853750229, 0.0034167971462011337, 0.0035564154386520386, 0.0036960337311029434, 0.0038356520235538483, 0.003975270316004753, 0.004114888608455658, 0.004254506900906563, 0.004394125193357468, 0.0045337434858083725, 0.004673361778259277]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 4.0, 6.0, 4.0, 3.0, 8.0, 3.0, 18.0, 17.0, 11.0, 10.0, 20.0, 22.0, 23.0, 30.0, 30.0, 34.0, 35.0, 39.0, 34.0, 35.0, 39.0, 43.0, 40.0, 37.0, 27.0, 38.0, 49.0, 33.0, 30.0, 37.0, 32.0, 34.0, 32.0, 26.0, 23.0, 17.0, 9.0, 11.0, 13.0, 6.0, 10.0, 9.0, 6.0, 8.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-175.625, -169.939453125, -164.25390625, -158.568359375, -152.8828125, -147.197265625, -141.51171875, -135.826171875, -130.140625, -124.455078125, -118.76953125, -113.083984375, -107.3984375, -101.712890625, -96.02734375, -90.341796875, -84.65625, -78.970703125, -73.28515625, -67.599609375, -61.9140625, -56.228515625, -50.54296875, -44.857421875, -39.171875, -33.486328125, -27.80078125, -22.115234375, -16.4296875, -10.744140625, -5.05859375, 0.626953125, 6.3125, 11.998046875, 17.68359375, 23.369140625, 29.0546875, 34.740234375, 40.42578125, 46.111328125, 51.796875, 57.482421875, 63.16796875, 68.853515625, 74.5390625, 80.224609375, 85.91015625, 91.595703125, 97.28125, 102.966796875, 108.65234375, 114.337890625, 120.0234375, 125.708984375, 131.39453125, 137.080078125, 142.765625, 148.451171875, 154.13671875, 159.822265625, 165.5078125, 171.193359375, 176.87890625, 182.564453125, 188.25]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 0.0, 3.0, 3.0, 8.0, 3.0, 7.0, 3.0, 14.0, 15.0, 13.0, 18.0, 22.0, 38.0, 65.0, 69.0, 116.0, 208.0, 430.0, 790.0, 1873.0, 5245.0, 16726.0, 66401.0, 332885.0, 483447.0, 103482.0, 24694.0, 7224.0, 2540.0, 1065.0, 456.0, 253.0, 125.0, 79.0, 63.0, 50.0, 28.0, 18.0, 12.0, 18.0, 4.0, 13.0, 10.0, 5.0, 7.0, 1.0, 2.0, 3.0, 0.0, 4.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-29.90625, -28.946044921875, -27.98583984375, -27.025634765625, -26.0654296875, -25.105224609375, -24.14501953125, -23.184814453125, -22.224609375, -21.264404296875, -20.30419921875, -19.343994140625, -18.3837890625, -17.423583984375, -16.46337890625, -15.503173828125, -14.54296875, -13.582763671875, -12.62255859375, -11.662353515625, -10.7021484375, -9.741943359375, -8.78173828125, -7.821533203125, -6.861328125, -5.901123046875, -4.94091796875, -3.980712890625, -3.0205078125, -2.060302734375, -1.10009765625, -0.139892578125, 0.8203125, 1.780517578125, 2.74072265625, 3.700927734375, 4.6611328125, 5.621337890625, 6.58154296875, 7.541748046875, 8.501953125, 9.462158203125, 10.42236328125, 11.382568359375, 12.3427734375, 13.302978515625, 14.26318359375, 15.223388671875, 16.18359375, 17.143798828125, 18.10400390625, 19.064208984375, 20.0244140625, 20.984619140625, 21.94482421875, 22.905029296875, 23.865234375, 24.825439453125, 25.78564453125, 26.745849609375, 27.7060546875, 28.666259765625, 29.62646484375, 30.586669921875, 31.546875]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 8.0, 11.0, 15.0, 24.0, 34.0, 51.0, 78.0, 94.0, 107.0, 148.0, 2085.0, 76.0, 88.0, 73.0, 55.0, 36.0, 30.0, 16.0, 11.0, 11.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-510.5, -494.0703125, -477.640625, -461.2109375, -444.78125, -428.3515625, -411.921875, -395.4921875, -379.0625, -362.6328125, -346.203125, -329.7734375, -313.34375, -296.9140625, -280.484375, -264.0546875, -247.625, -231.1953125, -214.765625, -198.3359375, -181.90625, -165.4765625, -149.046875, -132.6171875, -116.1875, -99.7578125, -83.328125, -66.8984375, -50.46875, -34.0390625, -17.609375, -1.1796875, 15.25, 31.6796875, 48.109375, 64.5390625, 80.96875, 97.3984375, 113.828125, 130.2578125, 146.6875, 163.1171875, 179.546875, 195.9765625, 212.40625, 228.8359375, 245.265625, 261.6953125, 278.125, 294.5546875, 310.984375, 327.4140625, 343.84375, 360.2734375, 376.703125, 393.1328125, 409.5625, 425.9921875, 442.421875, 458.8515625, 475.28125, 491.7109375, 508.140625, 524.5703125, 541.0]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 9.0, 12.0, 11.0, 15.0, 18.0, 43.0, 43.0, 63.0, 170.0, 205.0, 404.0, 831.0, 2601.0, 27793.0, 2947763.0, 156884.0, 6291.0, 1237.0, 525.0, 303.0, 178.0, 108.0, 66.0, 45.0, 26.0, 18.0, 8.0, 10.0, 6.0, 4.0, 1.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.9375, -53.8447265625, -51.751953125, -49.6591796875, -47.56640625, -45.4736328125, -43.380859375, -41.2880859375, -39.1953125, -37.1025390625, -35.009765625, -32.9169921875, -30.82421875, -28.7314453125, -26.638671875, -24.5458984375, -22.453125, -20.3603515625, -18.267578125, -16.1748046875, -14.08203125, -11.9892578125, -9.896484375, -7.8037109375, -5.7109375, -3.6181640625, -1.525390625, 0.5673828125, 2.66015625, 4.7529296875, 6.845703125, 8.9384765625, 11.03125, 13.1240234375, 15.216796875, 17.3095703125, 19.40234375, 21.4951171875, 23.587890625, 25.6806640625, 27.7734375, 29.8662109375, 31.958984375, 34.0517578125, 36.14453125, 38.2373046875, 40.330078125, 42.4228515625, 44.515625, 46.6083984375, 48.701171875, 50.7939453125, 52.88671875, 54.9794921875, 57.072265625, 59.1650390625, 61.2578125, 63.3505859375, 65.443359375, 67.5361328125, 69.62890625, 71.7216796875, 73.814453125, 75.9072265625, 78.0]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 6.0, 7.0, 11.0, 16.0, 22.0, 33.0, 77.0, 131.0, 167.0, 186.0, 146.0, 74.0, 36.0, 31.0, 21.0, 11.0, 5.0, 7.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-427.74658203125, -414.37811279296875, -401.0096435546875, -387.64117431640625, -374.272705078125, -360.90423583984375, -347.5357971191406, -334.1673278808594, -320.7988586425781, -307.4303894042969, -294.0619201660156, -280.6934509277344, -267.32501220703125, -253.95652770996094, -240.58807373046875, -227.2196044921875, -213.85113525390625, -200.482666015625, -187.11419677734375, -173.74574279785156, -160.3772735595703, -147.00880432128906, -133.64035034179688, -120.27188110351562, -106.90341186523438, -93.53494262695312, -80.1664810180664, -66.79801940917969, -53.42955017089844, -40.06108093261719, -26.69261932373047, -13.32415771484375, 0.044281005859375, 13.41274642944336, 26.781211853027344, 40.14967727661133, 53.51814270019531, 66.88661193847656, 80.25507354736328, 93.62353515625, 106.99200439453125, 120.3604736328125, 133.72894287109375, 147.09739685058594, 160.4658660888672, 173.83433532714844, 187.20278930664062, 200.57125854492188, 213.93972778320312, 227.30819702148438, 240.67666625976562, 254.0451202392578, 267.41357421875, 280.78204345703125, 294.1505126953125, 307.51898193359375, 320.887451171875, 334.25592041015625, 347.6243896484375, 360.99285888671875, 374.361328125, 387.72979736328125, 401.0982360839844, 414.4667053222656, 427.8351745605469]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 7.0, 12.0, 12.0, 16.0, 14.0, 17.0, 12.0, 19.0, 18.0, 23.0, 35.0, 22.0, 38.0, 46.0, 43.0, 41.0, 38.0, 42.0, 43.0, 43.0, 44.0, 43.0, 37.0, 31.0, 36.0, 28.0, 33.0, 22.0, 24.0, 26.0, 24.0, 18.0, 15.0, 16.0, 12.0, 8.0, 2.0, 8.0, 9.0, 8.0, 5.0, 4.0, 5.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-322.82275390625, -311.8260192871094, -300.8292541503906, -289.83251953125, -278.83575439453125, -267.8390197753906, -256.84228515625, -245.8455352783203, -234.84878540039062, -223.85203552246094, -212.85528564453125, -201.85855102539062, -190.86180114746094, -179.86505126953125, -168.86831665039062, -157.87156677246094, -146.87481689453125, -135.87806701660156, -124.8813247680664, -113.88458251953125, -102.88783264160156, -91.89108276367188, -80.89434051513672, -69.89759826660156, -58.900848388671875, -47.90410232543945, -36.90735626220703, -25.91061019897461, -14.913864135742188, -3.9171180725097656, 7.079627990722656, 18.076370239257812, 29.0731201171875, 40.06986618041992, 51.066612243652344, 62.063358306884766, 73.06010437011719, 84.05685424804688, 95.05359649658203, 106.05033874511719, 117.04708862304688, 128.04383850097656, 139.04058837890625, 150.03732299804688, 161.03407287597656, 172.03082275390625, 183.02755737304688, 194.02430725097656, 205.02105712890625, 216.01780700683594, 227.01455688476562, 238.01129150390625, 249.00804138183594, 260.0047912597656, 271.00152587890625, 281.998291015625, 292.9950256347656, 303.99176025390625, 314.988525390625, 325.9852600097656, 336.98199462890625, 347.978759765625, 358.9754943847656, 369.97222900390625, 380.968994140625]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 2.0, 3.0, 5.0, 2.0, 6.0, 11.0, 10.0, 14.0, 22.0, 23.0, 27.0, 33.0, 37.0, 58.0, 68.0, 77.0, 87.0, 131.0, 155.0, 203.0, 282.0, 391.0, 562.0, 895.0, 1041470.0, 1215.0, 714.0, 509.0, 391.0, 265.0, 195.0, 135.0, 109.0, 82.0, 80.0, 61.0, 46.0, 40.0, 29.0, 25.0, 23.0, 14.0, 11.0, 13.0, 7.0, 6.0, 6.0, 4.0, 7.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-129.21395874023438, -125.506103515625, -121.79825592041016, -118.09040069580078, -114.38255310058594, -110.67469787597656, -106.96684265136719, -103.25899505615234, -99.55113983154297, -95.8432846069336, -92.13543701171875, -88.42758178710938, -84.71973419189453, -81.01187896728516, -77.30403137207031, -73.59617614746094, -69.88832092285156, -66.18046569824219, -62.472618103027344, -58.76476287841797, -55.05691146850586, -51.34906005859375, -47.64120864868164, -43.93335723876953, -40.22550964355469, -36.51765823364258, -32.80980682373047, -29.101953506469727, -25.394100189208984, -21.686248779296875, -17.978397369384766, -14.270544052124023, -10.562690734863281, -6.8548383712768555, -3.146986484527588, 0.5608654022216797, 4.2687177658081055, 7.976570129394531, 11.68442153930664, 15.392274856567383, 19.100126266479492, 22.8079776763916, 26.515830993652344, 30.223682403564453, 33.93153381347656, 37.63938903808594, 41.34723663330078, 45.055091857910156, 48.762943267822266, 52.470794677734375, 56.178646087646484, 59.886497497558594, 63.59435272216797, 67.30220031738281, 71.01005554199219, 74.71791076660156, 78.4257583618164, 82.13361358642578, 85.84146118164062, 89.54931640625, 93.25716400146484, 96.96501922607422, 100.67286682128906, 104.38072204589844, 108.08857727050781]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 5.0, 2.0, 5.0, 4.0, 3.0, 8.0, 9.0, 11.0, 20.0, 22.0, 31.0, 46.0, 129.0, 796.0, 51427168.0, 34027.0, 662.0, 108.0, 41.0, 18.0, 16.0, 9.0, 5.0, 8.0, 13.0, 3.0, 4.0, 6.0, 0.0, 2.0, 0.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-947.4556884765625, -910.9619750976562, -874.46826171875, -837.9745483398438, -801.4808349609375, -764.9871826171875, -728.4934692382812, -691.999755859375, -655.5060424804688, -619.0123291015625, -582.5186157226562, -546.02490234375, -509.5312194824219, -473.0375061035156, -436.5438232421875, -400.05010986328125, -363.556396484375, -327.06268310546875, -290.5689697265625, -254.07528686523438, -217.58157348632812, -181.08786010742188, -144.5941619873047, -108.1004638671875, -71.60675048828125, -35.11304473876953, 1.3806610107421875, 37.874366760253906, 74.36807250976562, 110.86178588867188, 147.35548400878906, 183.84918212890625, 220.3427734375, 256.83648681640625, 293.3302001953125, 329.8238830566406, 366.3175964355469, 402.8113098144531, 439.30499267578125, 475.7987060546875, 512.2924194335938, 548.7861328125, 585.2798461914062, 621.7735595703125, 658.2672119140625, 694.760986328125, 731.254638671875, 767.7483520507812, 804.2420654296875, 840.7357788085938, 877.2294921875, 913.7232055664062, 950.2169189453125, 986.7105712890625, 1023.2042846679688, 1059.697998046875, 1096.191650390625, 1132.685302734375, 1169.1790771484375, 1205.6727294921875, 1242.16650390625, 1278.66015625, 1315.1539306640625, 1351.6475830078125, 1388.141357421875]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 5.0, 2.0, 2.0, 5.0, 5.0, 9.0, 7.0, 15.0, 22.0, 38.0, 78.0, 171.0, 239.0, 400.0, 516.0, 761.0, 1069.0, 1518.0, 2360.0, 3605.0, 5586.0, 8668.0, 14220.0, 22126.0, 36893.0, 61161.0, 104489.0, 182662.0, 339232.0, 686611.0, 3895359.0, 403631.0, 215679.0, 121105.0, 71208.0, 42044.0, 25633.0, 15983.0, 9860.0, 6256.0, 4240.0, 2722.0, 1786.0, 1171.0, 772.0, 456.0, 345.0, 214.0, 137.0, 98.0, 76.0, 74.0, 54.0, 34.0, 23.0, 8.0, 7.0, 0.0, 0.0, 2.0], "bins": [-1.248046875, -1.21148681640625, -1.1749267578125, -1.13836669921875, -1.101806640625, -1.06524658203125, -1.0286865234375, -0.99212646484375, -0.95556640625, -0.91900634765625, -0.8824462890625, -0.84588623046875, -0.809326171875, -0.77276611328125, -0.7362060546875, -0.69964599609375, -0.6630859375, -0.62652587890625, -0.5899658203125, -0.55340576171875, -0.516845703125, -0.48028564453125, -0.4437255859375, -0.40716552734375, -0.37060546875, -0.33404541015625, -0.2974853515625, -0.26092529296875, -0.224365234375, -0.18780517578125, -0.1512451171875, -0.11468505859375, -0.078125, -0.04156494140625, -0.0050048828125, 0.03155517578125, 0.068115234375, 0.10467529296875, 0.1412353515625, 0.17779541015625, 0.21435546875, 0.25091552734375, 0.2874755859375, 0.32403564453125, 0.360595703125, 0.39715576171875, 0.4337158203125, 0.47027587890625, 0.5068359375, 0.54339599609375, 0.5799560546875, 0.61651611328125, 0.653076171875, 0.68963623046875, 0.7261962890625, 0.76275634765625, 0.79931640625, 0.83587646484375, 0.8724365234375, 0.90899658203125, 0.945556640625, 0.98211669921875, 1.0186767578125, 1.05523681640625, 1.091796875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 6.0, 6.0, 5.0, 7.0, 11.0, 14.0, 10.0, 25.0, 16.0, 32.0, 26.0, 27.0, 42.0, 32.0, 41.0, 32.0, 37.0, 40.0, 39.0, 1087.0, 37.0, 51.0, 41.0, 35.0, 35.0, 44.0, 27.0, 33.0, 36.0, 24.0, 26.0, 27.0, 14.0, 10.0, 11.0, 7.0, 6.0, 10.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 5.0, 0.0, 2.0], "bins": [-114.6875, -111.4384765625, -108.189453125, -104.9404296875, -101.69140625, -98.4423828125, -95.193359375, -91.9443359375, -88.6953125, -85.4462890625, -82.197265625, -78.9482421875, -75.69921875, -72.4501953125, -69.201171875, -65.9521484375, -62.703125, -59.4541015625, -56.205078125, -52.9560546875, -49.70703125, -46.4580078125, -43.208984375, -39.9599609375, -36.7109375, -33.4619140625, -30.212890625, -26.9638671875, -23.71484375, -20.4658203125, -17.216796875, -13.9677734375, -10.71875, -7.4697265625, -4.220703125, -0.9716796875, 2.27734375, 5.5263671875, 8.775390625, 12.0244140625, 15.2734375, 18.5224609375, 21.771484375, 25.0205078125, 28.26953125, 31.5185546875, 34.767578125, 38.0166015625, 41.265625, 44.5146484375, 47.763671875, 51.0126953125, 54.26171875, 57.5107421875, 60.759765625, 64.0087890625, 67.2578125, 70.5068359375, 73.755859375, 77.0048828125, 80.25390625, 83.5029296875, 86.751953125, 90.0009765625, 93.25]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [4.0, 4.0, 1.0, 5.0, 5.0, 10.0, 18.0, 13.0, 30.0, 49.0, 54.0, 58.0, 122.0, 133.0, 216.0, 329.0, 497.0, 697.0, 1037.0, 1463.0, 2079.0, 3157.0, 4877.0, 7059.0, 10526.0, 16452.0, 24488.0, 37595.0, 57265.0, 88896.0, 143730.0, 249456.0, 474989.0, 4007283.0, 492365.0, 255988.0, 148192.0, 90765.0, 58786.0, 38065.0, 25262.0, 16427.0, 11012.0, 7142.0, 4888.0, 3155.0, 2086.0, 1489.0, 1044.0, 642.0, 455.0, 331.0, 245.0, 174.0, 114.0, 56.0, 59.0, 25.0, 28.0, 19.0, 12.0, 18.0, 10.0, 5.0], "bins": [-1.482421875, -1.438201904296875, -1.39398193359375, -1.349761962890625, -1.3055419921875, -1.261322021484375, -1.21710205078125, -1.172882080078125, -1.128662109375, -1.084442138671875, -1.04022216796875, -0.996002197265625, -0.9517822265625, -0.907562255859375, -0.86334228515625, -0.819122314453125, -0.77490234375, -0.730682373046875, -0.68646240234375, -0.642242431640625, -0.5980224609375, -0.553802490234375, -0.50958251953125, -0.465362548828125, -0.421142578125, -0.376922607421875, -0.33270263671875, -0.288482666015625, -0.2442626953125, -0.200042724609375, -0.15582275390625, -0.111602783203125, -0.0673828125, -0.023162841796875, 0.02105712890625, 0.065277099609375, 0.1094970703125, 0.153717041015625, 0.19793701171875, 0.242156982421875, 0.286376953125, 0.330596923828125, 0.37481689453125, 0.419036865234375, 0.4632568359375, 0.507476806640625, 0.55169677734375, 0.595916748046875, 0.64013671875, 0.684356689453125, 0.72857666015625, 0.772796630859375, 0.8170166015625, 0.861236572265625, 0.90545654296875, 0.949676513671875, 0.993896484375, 1.038116455078125, 1.08233642578125, 1.126556396484375, 1.1707763671875, 1.214996337890625, 1.25921630859375, 1.303436279296875, 1.34765625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 7.0, 10.0, 3.0, 4.0, 11.0, 15.0, 13.0, 14.0, 20.0, 21.0, 24.0, 24.0, 24.0, 30.0, 35.0, 33.0, 46.0, 35.0, 43.0, 40.0, 33.0, 1062.0, 29.0, 43.0, 34.0, 39.0, 36.0, 33.0, 26.0, 25.0, 25.0, 24.0, 22.0, 27.0, 23.0, 14.0, 17.0, 18.0, 5.0, 12.0, 11.0, 4.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-128.5, -124.275390625, -120.05078125, -115.826171875, -111.6015625, -107.376953125, -103.15234375, -98.927734375, -94.703125, -90.478515625, -86.25390625, -82.029296875, -77.8046875, -73.580078125, -69.35546875, -65.130859375, -60.90625, -56.681640625, -52.45703125, -48.232421875, -44.0078125, -39.783203125, -35.55859375, -31.333984375, -27.109375, -22.884765625, -18.66015625, -14.435546875, -10.2109375, -5.986328125, -1.76171875, 2.462890625, 6.6875, 10.912109375, 15.13671875, 19.361328125, 23.5859375, 27.810546875, 32.03515625, 36.259765625, 40.484375, 44.708984375, 48.93359375, 53.158203125, 57.3828125, 61.607421875, 65.83203125, 70.056640625, 74.28125, 78.505859375, 82.73046875, 86.955078125, 91.1796875, 95.404296875, 99.62890625, 103.853515625, 108.078125, 112.302734375, 116.52734375, 120.751953125, 124.9765625, 129.201171875, 133.42578125, 137.650390625, 141.875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 5.0, 3.0, 2.0, 1.0, 2.0, 4.0, 8.0, 14.0, 21.0, 13.0, 31.0, 55.0, 63.0, 109.0, 120.0, 150.0, 253.0, 382.0, 455.0, 644.0, 854.0, 1324.0, 1746.0, 2452.0, 3451.0, 5080.0, 7461.0, 10768.0, 16349.0, 26865.0, 48420.0, 141316.0, 5745100.0, 149459.0, 49473.0, 26939.0, 16649.0, 10720.0, 7543.0, 5030.0, 3426.0, 2367.0, 1833.0, 1219.0, 862.0, 687.0, 499.0, 322.0, 244.0, 184.0, 137.0, 81.0, 70.0, 42.0, 36.0, 54.0, 23.0, 10.0, 5.0, 3.0, 5.0, 7.0, 4.0], "bins": [-3.71875, -3.6077880859375, -3.496826171875, -3.3858642578125, -3.27490234375, -3.1639404296875, -3.052978515625, -2.9420166015625, -2.8310546875, -2.7200927734375, -2.609130859375, -2.4981689453125, -2.38720703125, -2.2762451171875, -2.165283203125, -2.0543212890625, -1.943359375, -1.8323974609375, -1.721435546875, -1.6104736328125, -1.49951171875, -1.3885498046875, -1.277587890625, -1.1666259765625, -1.0556640625, -0.9447021484375, -0.833740234375, -0.7227783203125, -0.61181640625, -0.5008544921875, -0.389892578125, -0.2789306640625, -0.16796875, -0.0570068359375, 0.053955078125, 0.1649169921875, 0.27587890625, 0.3868408203125, 0.497802734375, 0.6087646484375, 0.7197265625, 0.8306884765625, 0.941650390625, 1.0526123046875, 1.16357421875, 1.2745361328125, 1.385498046875, 1.4964599609375, 1.607421875, 1.7183837890625, 1.829345703125, 1.9403076171875, 2.05126953125, 2.1622314453125, 2.273193359375, 2.3841552734375, 2.4951171875, 2.6060791015625, 2.717041015625, 2.8280029296875, 2.93896484375, 3.0499267578125, 3.160888671875, 3.2718505859375, 3.3828125]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 10.0, 6.0, 11.0, 13.0, 12.0, 13.0, 13.0, 11.0, 25.0, 21.0, 31.0, 35.0, 33.0, 22.0, 35.0, 39.0, 48.0, 46.0, 44.0, 1069.0, 41.0, 38.0, 46.0, 34.0, 37.0, 31.0, 35.0, 33.0, 34.0, 20.0, 21.0, 17.0, 13.0, 15.0, 8.0, 15.0, 8.0, 10.0, 6.0, 2.0, 4.0, 4.0, 3.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0], "bins": [-194.25, -188.568359375, -182.88671875, -177.205078125, -171.5234375, -165.841796875, -160.16015625, -154.478515625, -148.796875, -143.115234375, -137.43359375, -131.751953125, -126.0703125, -120.388671875, -114.70703125, -109.025390625, -103.34375, -97.662109375, -91.98046875, -86.298828125, -80.6171875, -74.935546875, -69.25390625, -63.572265625, -57.890625, -52.208984375, -46.52734375, -40.845703125, -35.1640625, -29.482421875, -23.80078125, -18.119140625, -12.4375, -6.755859375, -1.07421875, 4.607421875, 10.2890625, 15.970703125, 21.65234375, 27.333984375, 33.015625, 38.697265625, 44.37890625, 50.060546875, 55.7421875, 61.423828125, 67.10546875, 72.787109375, 78.46875, 84.150390625, 89.83203125, 95.513671875, 101.1953125, 106.876953125, 112.55859375, 118.240234375, 123.921875, 129.603515625, 135.28515625, 140.966796875, 146.6484375, 152.330078125, 158.01171875, 163.693359375, 169.375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 7.0, 12.0, 8.0, 17.0, 30.0, 50.0, 94.0, 503.0, 135.0, 42.0, 34.0, 19.0, 11.0, 8.0, 6.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-111.89189147949219, -105.8975601196289, -99.9032211303711, -93.90888977050781, -87.91455078125, -81.92021942138672, -75.92588806152344, -69.93154907226562, -63.937217712402344, -57.9428825378418, -51.94854736328125, -45.95421600341797, -39.95988082885742, -33.965545654296875, -27.971214294433594, -21.976879119873047, -15.9825439453125, -9.98820972442627, -3.993875503540039, 2.000457763671875, 7.994792938232422, 13.989128112792969, 19.98345947265625, 25.977794647216797, 31.972129821777344, 37.96646499633789, 43.96080017089844, 49.95513153076172, 55.949466705322266, 61.94380187988281, 67.9381332397461, 73.93246459960938, 79.92678833007812, 85.9211196899414, 91.91545867919922, 97.9097900390625, 103.90412902832031, 109.8984603881836, 115.89279174804688, 121.88713073730469, 127.88146209716797, 133.87579345703125, 139.87013244628906, 145.86447143554688, 151.85879516601562, 157.85313415527344, 163.84747314453125, 169.841796875, 175.8361358642578, 181.83047485351562, 187.82479858398438, 193.8191375732422, 199.8134765625, 205.80780029296875, 211.80213928222656, 217.79647827148438, 223.79080200195312, 229.78514099121094, 235.7794647216797, 241.7738037109375, 247.7681427001953, 253.76248168945312, 259.7568054199219, 265.7511291503906, 271.7454833984375]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 4.0, 4.0, 13.0, 50.0, 308.0, 463.0, 122.0, 18.0, 8.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1459.41357421875, -1422.2220458984375, -1385.030517578125, -1347.8388671875, -1310.6473388671875, -1273.455810546875, -1236.2642822265625, -1199.07275390625, -1161.881103515625, -1124.6895751953125, -1087.498046875, -1050.306396484375, -1013.1148681640625, -975.92333984375, -938.7318115234375, -901.5402221679688, -864.3486938476562, -827.1571655273438, -789.965576171875, -752.7740478515625, -715.5824584960938, -678.3909301757812, -641.1993408203125, -604.0078125, -566.8162841796875, -529.624755859375, -492.43316650390625, -455.24163818359375, -418.050048828125, -380.8585205078125, -343.6669616699219, -306.47540283203125, -269.28375244140625, -232.09219360351562, -194.900634765625, -157.70909118652344, -120.51753234863281, -83.32597351074219, -46.134429931640625, -8.94287109375, 28.248687744140625, 65.44024658203125, 102.63179779052734, 139.82334899902344, 177.01490783691406, 214.2064666748047, 251.39801025390625, 288.5895690917969, 325.7811279296875, 362.9726867675781, 400.16424560546875, 437.35577392578125, 474.54736328125, 511.7388916015625, 548.930419921875, 586.1220092773438, 623.3135986328125, 660.505126953125, 697.6967163085938, 734.8882446289062, 772.079833984375, 809.2713623046875, 846.462890625, 883.6544799804688, 920.8460083007812]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 3.0, 3.0, 4.0, 6.0, 3.0, 8.0, 3.0, 7.0, 7.0, 6.0, 15.0, 7.0, 6.0, 21.0, 12.0, 14.0, 9.0, 16.0, 17.0, 15.0, 18.0, 9.0, 19.0, 19.0, 23.0, 28.0, 39.0, 46.0, 47.0, 66.0, 64.0, 76.0, 84.0, 89.0, 156.0, 257.0, 379.0, 647.0, 1059.0, 1865.0, 2874.0, 8490.0, 4126628.0, 34373.0, 7266.0, 4409.0, 2054.0, 1028.0, 562.0, 374.0, 263.0, 194.0, 159.0, 137.0, 94.0, 63.0, 56.0, 40.0, 24.0, 14.0, 9.0, 10.0, 7.0], "bins": [-11.703125, -11.43695068359375, -11.1707763671875, -10.90460205078125, -10.638427734375, -10.37225341796875, -10.1060791015625, -9.83990478515625, -9.57373046875, -9.30755615234375, -9.0413818359375, -8.77520751953125, -8.509033203125, -8.24285888671875, -7.9766845703125, -7.71051025390625, -7.4443359375, -7.17816162109375, -6.9119873046875, -6.64581298828125, -6.379638671875, -6.11346435546875, -5.8472900390625, -5.58111572265625, -5.31494140625, -5.04876708984375, -4.7825927734375, -4.51641845703125, -4.250244140625, -3.98406982421875, -3.7178955078125, -3.45172119140625, -3.185546875, -2.91937255859375, -2.6531982421875, -2.38702392578125, -2.120849609375, -1.85467529296875, -1.5885009765625, -1.32232666015625, -1.05615234375, -0.78997802734375, -0.5238037109375, -0.25762939453125, 0.008544921875, 0.27471923828125, 0.5408935546875, 0.80706787109375, 1.0732421875, 1.33941650390625, 1.6055908203125, 1.87176513671875, 2.137939453125, 2.40411376953125, 2.6702880859375, 2.93646240234375, 3.20263671875, 3.46881103515625, 3.7349853515625, 4.00115966796875, 4.267333984375, 4.53350830078125, 4.7996826171875, 5.06585693359375, 5.33203125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 7.0, 3.0, 7.0, 22.0, 27.0, 463.0, 403.0, 22.0, 14.0, 16.0, 10.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.77880859375, -0.7610969543457031, -0.7433853149414062, -0.7256736755371094, -0.7079620361328125, -0.6902503967285156, -0.6725387573242188, -0.6548271179199219, -0.637115478515625, -0.6194038391113281, -0.6016921997070312, -0.5839805603027344, -0.5662689208984375, -0.5485572814941406, -0.5308456420898438, -0.5131340026855469, -0.49542236328125, -0.4777107238769531, -0.45999908447265625, -0.4422874450683594, -0.4245758056640625, -0.4068641662597656, -0.38915252685546875, -0.3714408874511719, -0.353729248046875, -0.3360176086425781, -0.31830596923828125, -0.3005943298339844, -0.2828826904296875, -0.2651710510253906, -0.24745941162109375, -0.22974777221679688, -0.2120361328125, -0.19432449340820312, -0.17661285400390625, -0.15890121459960938, -0.1411895751953125, -0.12347793579101562, -0.10576629638671875, -0.08805465698242188, -0.070343017578125, -0.052631378173828125, -0.03491973876953125, -0.017208099365234375, 0.0005035400390625, 0.018215179443359375, 0.03592681884765625, 0.053638458251953125, 0.07135009765625, 0.08906173706054688, 0.10677337646484375, 0.12448501586914062, 0.1421966552734375, 0.15990829467773438, 0.17761993408203125, 0.19533157348632812, 0.213043212890625, 0.23075485229492188, 0.24846649169921875, 0.2661781311035156, 0.2838897705078125, 0.3016014099121094, 0.31931304931640625, 0.3370246887207031, 0.354736328125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 2.0, 6.0, 6.0, 12.0, 15.0, 18.0, 24.0, 34.0, 45.0, 71.0, 102.0, 130.0, 197.0, 313.0, 458.0, 717.0, 1222.0, 1972.0, 3600.0, 6696.0, 14394.0, 49162.0, 4050491.0, 36487.0, 12906.0, 6212.0, 3552.0, 2036.0, 1260.0, 766.0, 511.0, 319.0, 190.0, 119.0, 87.0, 47.0, 29.0, 26.0, 13.0, 7.0, 8.0, 3.0, 7.0, 1.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.431640625, -1.386016845703125, -1.34039306640625, -1.294769287109375, -1.2491455078125, -1.203521728515625, -1.15789794921875, -1.112274169921875, -1.066650390625, -1.021026611328125, -0.97540283203125, -0.929779052734375, -0.8841552734375, -0.838531494140625, -0.79290771484375, -0.747283935546875, -0.70166015625, -0.656036376953125, -0.61041259765625, -0.564788818359375, -0.5191650390625, -0.473541259765625, -0.42791748046875, -0.382293701171875, -0.336669921875, -0.291046142578125, -0.24542236328125, -0.199798583984375, -0.1541748046875, -0.108551025390625, -0.06292724609375, -0.017303466796875, 0.0283203125, 0.073944091796875, 0.11956787109375, 0.165191650390625, 0.2108154296875, 0.256439208984375, 0.30206298828125, 0.347686767578125, 0.393310546875, 0.438934326171875, 0.48455810546875, 0.530181884765625, 0.5758056640625, 0.621429443359375, 0.66705322265625, 0.712677001953125, 0.75830078125, 0.803924560546875, 0.84954833984375, 0.895172119140625, 0.9407958984375, 0.986419677734375, 1.03204345703125, 1.077667236328125, 1.123291015625, 1.168914794921875, 1.21453857421875, 1.260162353515625, 1.3057861328125, 1.351409912109375, 1.39703369140625, 1.442657470703125, 1.48828125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 3.0, 8.0, 8.0, 10.0, 9.0, 14.0, 15.0, 22.0, 18.0, 144.0, 3635.0, 28.0, 21.0, 17.0, 22.0, 16.0, 15.0, 10.0, 11.0, 9.0, 9.0, 6.0, 6.0, 4.0, 2.0, 3.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65478515625, -0.6380386352539062, -0.6212921142578125, -0.6045455932617188, -0.587799072265625, -0.5710525512695312, -0.5543060302734375, -0.5375595092773438, -0.52081298828125, -0.5040664672851562, -0.4873199462890625, -0.47057342529296875, -0.453826904296875, -0.43708038330078125, -0.4203338623046875, -0.40358734130859375, -0.3868408203125, -0.37009429931640625, -0.3533477783203125, -0.33660125732421875, -0.319854736328125, -0.30310821533203125, -0.2863616943359375, -0.26961517333984375, -0.25286865234375, -0.23612213134765625, -0.2193756103515625, -0.20262908935546875, -0.185882568359375, -0.16913604736328125, -0.1523895263671875, -0.13564300537109375, -0.118896484375, -0.10214996337890625, -0.0854034423828125, -0.06865692138671875, -0.051910400390625, -0.03516387939453125, -0.0184173583984375, -0.00167083740234375, 0.01507568359375, 0.03182220458984375, 0.0485687255859375, 0.06531524658203125, 0.082061767578125, 0.09880828857421875, 0.1155548095703125, 0.13230133056640625, 0.1490478515625, 0.16579437255859375, 0.1825408935546875, 0.19928741455078125, 0.216033935546875, 0.23278045654296875, 0.2495269775390625, 0.26627349853515625, 0.28302001953125, 0.29976654052734375, 0.3165130615234375, 0.33325958251953125, 0.350006103515625, 0.36675262451171875, 0.3834991455078125, 0.40024566650390625, 0.4169921875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 14.0, 66.0, 782.0, 95.0, 19.0, 15.0, 7.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5481555461883545, -2.2760331630706787, -2.003910541534424, -1.731788158416748, -1.4596656560897827, -1.1875431537628174, -0.9154207706451416, -0.6432982683181763, -0.37117576599121094, -0.099053293466568, 0.17306917905807495, 0.4451916217803955, 0.7173141241073608, 0.9894366264343262, 1.261559009552002, 1.5336815118789673, 1.8058040142059326, 2.0779263973236084, 2.3500490188598633, 2.622171401977539, 2.894293785095215, 3.1664164066314697, 3.4385387897491455, 3.7106614112854004, 3.982783794403076, 4.254906177520752, 4.527028560638428, 4.799151420593262, 5.0712738037109375, 5.343396186828613, 5.615518569946289, 5.887640953063965, 6.159763336181641, 6.431885719299316, 6.704008102416992, 6.976130485534668, 7.248253345489502, 7.520375728607178, 7.7924981117248535, 8.064620971679688, 8.336743354797363, 8.608865737915039, 8.880988121032715, 9.15311050415039, 9.425232887268066, 9.697355270385742, 9.969478607177734, 10.24160099029541, 10.513723373413086, 10.785845756530762, 11.057968139648438, 11.330090522766113, 11.602212905883789, 11.874336242675781, 12.14645767211914, 12.418581008911133, 12.690702438354492, 12.962824821472168, 13.234947204589844, 13.50706958770752, 13.779191970825195, 14.051315307617188, 14.323436737060547, 14.595560073852539, 14.867682456970215]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 2.0, 5.0, 7.0, 22.0, 30.0, 45.0, 71.0, 97.0, 136.0, 141.0, 160.0, 116.0, 60.0, 47.0, 21.0, 13.0, 15.0, 7.0, 2.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.243732213973999, -3.1306803226470947, -3.0176284313201904, -2.904576539993286, -2.791524648666382, -2.6784727573394775, -2.5654208660125732, -2.452368974685669, -2.3393170833587646, -2.2262651920318604, -2.113213300704956, -2.0001614093780518, -1.8871095180511475, -1.7740576267242432, -1.6610057353973389, -1.5479538440704346, -1.4349019527435303, -1.321850061416626, -1.2087981700897217, -1.0957462787628174, -0.9826943874359131, -0.8696424961090088, -0.7565906047821045, -0.6435387134552002, -0.5304868221282959, -0.4174349308013916, -0.3043830394744873, -0.191331148147583, -0.07827925682067871, 0.034772634506225586, 0.14782452583312988, 0.2608764171600342, 0.3739280700683594, 0.48697996139526367, 0.600031852722168, 0.7130837440490723, 0.8261356353759766, 0.9391875267028809, 1.0522394180297852, 1.1652913093566895, 1.2783432006835938, 1.391395092010498, 1.5044469833374023, 1.6174988746643066, 1.730550765991211, 1.8436026573181152, 1.9566545486450195, 2.069706439971924, 2.182758331298828, 2.2958102226257324, 2.4088621139526367, 2.521914005279541, 2.6349658966064453, 2.7480177879333496, 2.861069679260254, 2.974121570587158, 3.0871734619140625, 3.200225353240967, 3.313277244567871, 3.4263291358947754, 3.5393810272216797, 3.652432918548584, 3.7654848098754883, 3.8785367012023926, 3.991588592529297]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 7.0, 10.0, 13.0, 6.0, 15.0, 12.0, 13.0, 24.0, 23.0, 35.0, 85.0, 99.0, 150.0, 211.0, 452.0, 896.0, 2239.0, 8225.0, 83593.0, 937778.0, 9856.0, 2598.0, 988.0, 457.0, 257.0, 165.0, 110.0, 59.0, 55.0, 30.0, 17.0, 21.0, 19.0, 10.0, 9.0, 6.0, 8.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.34765625, -5.203338623046875, -5.05902099609375, -4.914703369140625, -4.7703857421875, -4.626068115234375, -4.48175048828125, -4.337432861328125, -4.193115234375, -4.048797607421875, -3.90447998046875, -3.760162353515625, -3.6158447265625, -3.471527099609375, -3.32720947265625, -3.182891845703125, -3.03857421875, -2.894256591796875, -2.74993896484375, -2.605621337890625, -2.4613037109375, -2.316986083984375, -2.17266845703125, -2.028350830078125, -1.884033203125, -1.739715576171875, -1.59539794921875, -1.451080322265625, -1.3067626953125, -1.162445068359375, -1.01812744140625, -0.873809814453125, -0.7294921875, -0.585174560546875, -0.44085693359375, -0.296539306640625, -0.1522216796875, -0.007904052734375, 0.13641357421875, 0.280731201171875, 0.425048828125, 0.569366455078125, 0.71368408203125, 0.858001708984375, 1.0023193359375, 1.146636962890625, 1.29095458984375, 1.435272216796875, 1.57958984375, 1.723907470703125, 1.86822509765625, 2.012542724609375, 2.1568603515625, 2.301177978515625, 2.44549560546875, 2.589813232421875, 2.734130859375, 2.878448486328125, 3.02276611328125, 3.167083740234375, 3.3114013671875, 3.455718994140625, 3.60003662109375, 3.744354248046875, 3.888671875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 9.0, 1.0, 10.0, 22.0, 30.0, 819.0, 44.0, 20.0, 17.0, 13.0, 9.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77197265625, -0.7543525695800781, -0.7367324829101562, -0.7191123962402344, -0.7014923095703125, -0.6838722229003906, -0.6662521362304688, -0.6486320495605469, -0.631011962890625, -0.6133918762207031, -0.5957717895507812, -0.5781517028808594, -0.5605316162109375, -0.5429115295410156, -0.5252914428710938, -0.5076713562011719, -0.49005126953125, -0.4724311828613281, -0.45481109619140625, -0.4371910095214844, -0.4195709228515625, -0.4019508361816406, -0.38433074951171875, -0.3667106628417969, -0.349090576171875, -0.3314704895019531, -0.31385040283203125, -0.2962303161621094, -0.2786102294921875, -0.2609901428222656, -0.24337005615234375, -0.22574996948242188, -0.2081298828125, -0.19050979614257812, -0.17288970947265625, -0.15526962280273438, -0.1376495361328125, -0.12002944946289062, -0.10240936279296875, -0.08478927612304688, -0.067169189453125, -0.049549102783203125, -0.03192901611328125, -0.014308929443359375, 0.0033111572265625, 0.020931243896484375, 0.03855133056640625, 0.056171417236328125, 0.07379150390625, 0.09141159057617188, 0.10903167724609375, 0.12665176391601562, 0.1442718505859375, 0.16189193725585938, 0.17951202392578125, 0.19713211059570312, 0.214752197265625, 0.23237228393554688, 0.24999237060546875, 0.2676124572753906, 0.2852325439453125, 0.3028526306152344, 0.32047271728515625, 0.3380928039550781, 0.355712890625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 3.0, 4.0, 1.0, 1.0, 7.0, 2.0, 9.0, 21.0, 16.0, 27.0, 41.0, 44.0, 73.0, 102.0, 123.0, 182.0, 274.0, 417.0, 630.0, 921.0, 1374.0, 2149.0, 3589.0, 5943.0, 9665.0, 16955.0, 32085.0, 71849.0, 355580.0, 397627.0, 73494.0, 32439.0, 16800.0, 9871.0, 5989.0, 3587.0, 2274.0, 1506.0, 945.0, 635.0, 373.0, 279.0, 214.0, 133.0, 103.0, 68.0, 40.0, 17.0, 18.0, 26.0, 9.0, 8.0, 10.0, 4.0, 4.0, 5.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.59814453125, -0.5800247192382812, -0.5619049072265625, -0.5437850952148438, -0.525665283203125, -0.5075454711914062, -0.4894256591796875, -0.47130584716796875, -0.45318603515625, -0.43506622314453125, -0.4169464111328125, -0.39882659912109375, -0.380706787109375, -0.36258697509765625, -0.3444671630859375, -0.32634735107421875, -0.3082275390625, -0.29010772705078125, -0.2719879150390625, -0.25386810302734375, -0.235748291015625, -0.21762847900390625, -0.1995086669921875, -0.18138885498046875, -0.16326904296875, -0.14514923095703125, -0.1270294189453125, -0.10890960693359375, -0.090789794921875, -0.07266998291015625, -0.0545501708984375, -0.03643035888671875, -0.018310546875, -0.00019073486328125, 0.0179290771484375, 0.03604888916015625, 0.054168701171875, 0.07228851318359375, 0.0904083251953125, 0.10852813720703125, 0.12664794921875, 0.14476776123046875, 0.1628875732421875, 0.18100738525390625, 0.199127197265625, 0.21724700927734375, 0.2353668212890625, 0.25348663330078125, 0.2716064453125, 0.28972625732421875, 0.3078460693359375, 0.32596588134765625, 0.344085693359375, 0.36220550537109375, 0.3803253173828125, 0.39844512939453125, 0.41656494140625, 0.43468475341796875, 0.4528045654296875, 0.47092437744140625, 0.489044189453125, 0.5071640014648438, 0.5252838134765625, 0.5434036254882812, 0.5615234375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 12.0, 12.0, 17.0, 19.0, 15.0, 18.0, 26.0, 23.0, 36.0, 37.0, 38.0, 30.0, 34.0, 38.0, 36.0, 33.0, 53.0, 43.0, 51.0, 42.0, 53.0, 32.0, 37.0, 40.0, 35.0, 19.0, 25.0, 21.0, 20.0, 20.0, 17.0, 11.0, 14.0, 7.0, 7.0, 7.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.63134765625, -0.6109695434570312, -0.5905914306640625, -0.5702133178710938, -0.549835205078125, -0.5294570922851562, -0.5090789794921875, -0.48870086669921875, -0.46832275390625, -0.44794464111328125, -0.4275665283203125, -0.40718841552734375, -0.386810302734375, -0.36643218994140625, -0.3460540771484375, -0.32567596435546875, -0.3052978515625, -0.28491973876953125, -0.2645416259765625, -0.24416351318359375, -0.223785400390625, -0.20340728759765625, -0.1830291748046875, -0.16265106201171875, -0.14227294921875, -0.12189483642578125, -0.1015167236328125, -0.08113861083984375, -0.060760498046875, -0.04038238525390625, -0.0200042724609375, 0.00037384033203125, 0.020751953125, 0.04113006591796875, 0.0615081787109375, 0.08188629150390625, 0.102264404296875, 0.12264251708984375, 0.1430206298828125, 0.16339874267578125, 0.18377685546875, 0.20415496826171875, 0.2245330810546875, 0.24491119384765625, 0.265289306640625, 0.28566741943359375, 0.3060455322265625, 0.32642364501953125, 0.3468017578125, 0.36717987060546875, 0.3875579833984375, 0.40793609619140625, 0.428314208984375, 0.44869232177734375, 0.4690704345703125, 0.48944854736328125, 0.50982666015625, 0.5302047729492188, 0.5505828857421875, 0.5709609985351562, 0.591339111328125, 0.6117172241210938, 0.6320953369140625, 0.6524734497070312, 0.6728515625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 5.0, 6.0, 9.0, 20.0, 52.0, 131.0, 489.0, 4846.0, 1032920.0, 9245.0, 548.0, 151.0, 69.0, 25.0, 17.0, 7.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.059326171875, -0.05799531936645508, -0.056664466857910156, -0.055333614349365234, -0.05400276184082031, -0.05267190933227539, -0.05134105682373047, -0.05001020431518555, -0.048679351806640625, -0.0473484992980957, -0.04601764678955078, -0.04468679428100586, -0.04335594177246094, -0.042025089263916016, -0.040694236755371094, -0.03936338424682617, -0.03803253173828125, -0.03670167922973633, -0.035370826721191406, -0.034039974212646484, -0.03270912170410156, -0.03137826919555664, -0.03004741668701172, -0.028716564178466797, -0.027385711669921875, -0.026054859161376953, -0.02472400665283203, -0.02339315414428711, -0.022062301635742188, -0.020731449127197266, -0.019400596618652344, -0.018069744110107422, -0.0167388916015625, -0.015408039093017578, -0.014077186584472656, -0.012746334075927734, -0.011415481567382812, -0.01008462905883789, -0.008753776550292969, -0.007422924041748047, -0.006092071533203125, -0.004761219024658203, -0.0034303665161132812, -0.0020995140075683594, -0.0007686614990234375, 0.0005621910095214844, 0.0018930435180664062, 0.003223896026611328, 0.00455474853515625, 0.005885601043701172, 0.007216453552246094, 0.008547306060791016, 0.009878158569335938, 0.01120901107788086, 0.012539863586425781, 0.013870716094970703, 0.015201568603515625, 0.016532421112060547, 0.01786327362060547, 0.01919412612915039, 0.020524978637695312, 0.021855831146240234, 0.023186683654785156, 0.024517536163330078, 0.025848388671875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 7.0, 8.0, 15.0, 16.0, 28.0, 31.0, 65.0, 88.0, 117.0, 126.0, 103.0, 117.0, 78.0, 73.0, 40.0, 34.0, 17.0, 14.0, 5.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.556510925292969e-06, -6.350688636302948e-06, -6.144866347312927e-06, -5.9390440583229065e-06, -5.733221769332886e-06, -5.527399480342865e-06, -5.321577191352844e-06, -5.1157549023628235e-06, -4.909932613372803e-06, -4.704110324382782e-06, -4.498288035392761e-06, -4.2924657464027405e-06, -4.08664345741272e-06, -3.880821168422699e-06, -3.6749988794326782e-06, -3.4691765904426575e-06, -3.2633543014526367e-06, -3.057532012462616e-06, -2.8517097234725952e-06, -2.6458874344825745e-06, -2.4400651454925537e-06, -2.234242856502533e-06, -2.028420567512512e-06, -1.8225982785224915e-06, -1.6167759895324707e-06, -1.41095370054245e-06, -1.2051314115524292e-06, -9.993091225624084e-07, -7.934868335723877e-07, -5.876645445823669e-07, -3.818422555923462e-07, -1.7601996660232544e-07, 2.9802322387695312e-08, 2.3562461137771606e-07, 4.414469003677368e-07, 6.472691893577576e-07, 8.530914783477783e-07, 1.058913767337799e-06, 1.2647360563278198e-06, 1.4705583453178406e-06, 1.6763806343078613e-06, 1.882202923297882e-06, 2.088025212287903e-06, 2.2938475012779236e-06, 2.4996697902679443e-06, 2.705492079257965e-06, 2.911314368247986e-06, 3.1171366572380066e-06, 3.3229589462280273e-06, 3.528781235218048e-06, 3.734603524208069e-06, 3.94042581319809e-06, 4.14624810218811e-06, 4.352070391178131e-06, 4.557892680168152e-06, 4.763714969158173e-06, 4.969537258148193e-06, 5.175359547138214e-06, 5.381181836128235e-06, 5.587004125118256e-06, 5.792826414108276e-06, 5.998648703098297e-06, 6.204470992088318e-06, 6.410293281078339e-06, 6.616115570068359e-06]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 6.0, 5.0, 8.0, 14.0, 11.0, 15.0, 18.0, 17.0, 28.0, 74.0, 117.0, 230.0, 530.0, 1195.0, 3029.0, 10624.0, 76234.0, 911645.0, 33979.0, 6932.0, 2109.0, 876.0, 378.0, 199.0, 97.0, 61.0, 24.0, 22.0, 17.0, 10.0, 12.0, 8.0, 3.0, 4.0, 2.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.006771087646484375, -0.006514012813568115, -0.0062569379806518555, -0.005999863147735596, -0.005742788314819336, -0.005485713481903076, -0.005228638648986816, -0.004971563816070557, -0.004714488983154297, -0.004457414150238037, -0.004200339317321777, -0.003943264484405518, -0.003686189651489258, -0.003429114818572998, -0.0031720399856567383, -0.0029149651527404785, -0.0026578903198242188, -0.002400815486907959, -0.0021437406539916992, -0.0018866658210754395, -0.0016295909881591797, -0.00137251615524292, -0.0011154413223266602, -0.0008583664894104004, -0.0006012916564941406, -0.00034421682357788086, -8.71419906616211e-05, 0.00016993284225463867, 0.00042700767517089844, 0.0006840825080871582, 0.000941157341003418, 0.0011982321739196777, 0.0014553070068359375, 0.0017123818397521973, 0.001969456672668457, 0.002226531505584717, 0.0024836063385009766, 0.0027406811714172363, 0.002997756004333496, 0.003254830837249756, 0.0035119056701660156, 0.0037689805030822754, 0.004026055335998535, 0.004283130168914795, 0.004540205001831055, 0.0047972798347473145, 0.005054354667663574, 0.005311429500579834, 0.005568504333496094, 0.0058255791664123535, 0.006082653999328613, 0.006339728832244873, 0.006596803665161133, 0.006853878498077393, 0.007110953330993652, 0.007368028163909912, 0.007625102996826172, 0.007882177829742432, 0.008139252662658691, 0.008396327495574951, 0.008653402328491211, 0.00891047716140747, 0.00916755199432373, 0.00942462682723999, 0.00968170166015625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 1.0, 2.0, 7.0, 12.0, 8.0, 13.0, 25.0, 36.0, 61.0, 111.0, 208.0, 233.0, 117.0, 63.0, 32.0, 24.0, 21.0, 15.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0107574462890625, -0.010528534650802612, -0.010299623012542725, -0.010070711374282837, -0.00984179973602295, -0.009612888097763062, -0.009383976459503174, -0.009155064821243286, -0.008926153182983398, -0.00869724154472351, -0.008468329906463623, -0.008239418268203735, -0.008010506629943848, -0.00778159499168396, -0.007552683353424072, -0.007323771715164185, -0.007094860076904297, -0.006865948438644409, -0.0066370368003845215, -0.006408125162124634, -0.006179213523864746, -0.005950301885604858, -0.005721390247344971, -0.005492478609085083, -0.005263566970825195, -0.005034655332565308, -0.00480574369430542, -0.004576832056045532, -0.0043479204177856445, -0.004119008779525757, -0.003890097141265869, -0.0036611855030059814, -0.0034322738647460938, -0.003203362226486206, -0.0029744505882263184, -0.0027455389499664307, -0.002516627311706543, -0.0022877156734466553, -0.0020588040351867676, -0.0018298923969268799, -0.0016009807586669922, -0.0013720691204071045, -0.0011431574821472168, -0.0009142458438873291, -0.0006853342056274414, -0.0004564225673675537, -0.00022751092910766602, 1.4007091522216797e-06, 0.00023031234741210938, 0.00045922398567199707, 0.0006881356239318848, 0.0009170472621917725, 0.0011459589004516602, 0.0013748705387115479, 0.0016037821769714355, 0.0018326938152313232, 0.002061605453491211, 0.0022905170917510986, 0.0025194287300109863, 0.002748340368270874, 0.0029772520065307617, 0.0032061636447906494, 0.003435075283050537, 0.003663986921310425, 0.0038928985595703125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 14.0, 17.0, 58.0, 483.0, 295.0, 81.0, 31.0, 17.0, 9.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.689971923828125, -22.160972595214844, -21.631973266601562, -21.10297203063965, -20.573972702026367, -20.044973373413086, -19.515974044799805, -18.986974716186523, -18.45797348022461, -17.928974151611328, -17.399974822998047, -16.870973587036133, -16.34197425842285, -15.81297492980957, -15.283975601196289, -14.754976272583008, -14.225976943969727, -13.696977615356445, -13.167977333068848, -12.638978004455566, -12.109977722167969, -11.580978393554688, -11.051979064941406, -10.522979736328125, -9.993979454040527, -9.464980125427246, -8.935979843139648, -8.406980514526367, -7.877980709075928, -7.348980903625488, -6.819981575012207, -6.290981769561768, -5.761983871459961, -5.2329840660095215, -4.703984260559082, -4.174984931945801, -3.6459851264953613, -3.116985321044922, -2.5879857540130615, -2.058986186981201, -1.5299863815307617, -1.0009866952896118, -0.4719870090484619, 0.05701267719268799, 0.5860123634338379, 1.1150121688842773, 1.6440117359161377, 2.173011302947998, 2.7020111083984375, 3.231010913848877, 3.7600104808807373, 4.289010047912598, 4.818009853363037, 5.347009658813477, 5.876008987426758, 6.405008792877197, 6.934008598327637, 7.463008403778076, 7.992008209228516, 8.521007537841797, 9.050006866455078, 9.579007148742676, 10.108006477355957, 10.637006759643555, 11.166006088256836]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 6.0, 4.0, 5.0, 9.0, 16.0, 28.0, 37.0, 70.0, 99.0, 133.0, 177.0, 160.0, 107.0, 54.0, 38.0, 18.0, 11.0, 7.0, 7.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.262331008911133, -8.761574745178223, -8.260818481445312, -7.760062217712402, -7.259305953979492, -6.758549690246582, -6.25779390335083, -5.75703763961792, -5.25628137588501, -4.7555251121521, -4.2547688484191895, -3.7540128231048584, -3.2532565593719482, -2.752500295639038, -2.251744270324707, -1.7509880065917969, -1.2502317428588867, -0.7494755387306213, -0.24871933460235596, 0.25203680992126465, 0.7527930736541748, 1.253549337387085, 1.754305362701416, 2.255061626434326, 2.7558178901672363, 3.2565741539001465, 3.7573304176330566, 4.258086204528809, 4.758842468261719, 5.259598731994629, 5.760354995727539, 6.261111259460449, 6.761867523193359, 7.2626237869262695, 7.76338005065918, 8.26413631439209, 8.764892578125, 9.26564884185791, 9.76640510559082, 10.267160415649414, 10.76791763305664, 11.26867389678955, 11.769430160522461, 12.270186424255371, 12.770942687988281, 13.271698951721191, 13.772455215454102, 14.273210525512695, 14.773966789245605, 15.274723052978516, 15.775479316711426, 16.276235580444336, 16.77699089050293, 17.277748107910156, 17.77850341796875, 18.279260635375977, 18.78001594543457, 19.280771255493164, 19.78152847290039, 20.282283782958984, 20.78304100036621, 21.283796310424805, 21.78455352783203, 22.285308837890625, 22.78606605529785]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 4.0, 6.0, 11.0, 8.0, 23.0, 44.0, 54.0, 103.0, 163.0, 350.0, 999.0, 11295.0, 4176424.0, 3838.0, 674.0, 180.0, 58.0, 27.0, 10.0, 3.0, 9.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.9375, -78.09130859375, -76.2451171875, -74.39892578125, -72.552734375, -70.70654296875, -68.8603515625, -67.01416015625, -65.16796875, -63.32177734375, -61.4755859375, -59.62939453125, -57.783203125, -55.93701171875, -54.0908203125, -52.24462890625, -50.3984375, -48.55224609375, -46.7060546875, -44.85986328125, -43.013671875, -41.16748046875, -39.3212890625, -37.47509765625, -35.62890625, -33.78271484375, -31.9365234375, -30.09033203125, -28.244140625, -26.39794921875, -24.5517578125, -22.70556640625, -20.859375, -19.01318359375, -17.1669921875, -15.32080078125, -13.474609375, -11.62841796875, -9.7822265625, -7.93603515625, -6.08984375, -4.24365234375, -2.3974609375, -0.55126953125, 1.294921875, 3.14111328125, 4.9873046875, 6.83349609375, 8.6796875, 10.52587890625, 12.3720703125, 14.21826171875, 16.064453125, 17.91064453125, 19.7568359375, 21.60302734375, 23.44921875, 25.29541015625, 27.1416015625, 28.98779296875, 30.833984375, 32.68017578125, 34.5263671875, 36.37255859375, 38.21875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 4.0, 9.0, 11.0, 25.0, 49.0, 821.0, 26.0, 20.0, 16.0, 7.0, 6.0, 3.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.74951171875, -0.7322006225585938, -0.7148895263671875, -0.6975784301757812, -0.680267333984375, -0.6629562377929688, -0.6456451416015625, -0.6283340454101562, -0.61102294921875, -0.5937118530273438, -0.5764007568359375, -0.5590896606445312, -0.541778564453125, -0.5244674682617188, -0.5071563720703125, -0.48984527587890625, -0.4725341796875, -0.45522308349609375, -0.4379119873046875, -0.42060089111328125, -0.403289794921875, -0.38597869873046875, -0.3686676025390625, -0.35135650634765625, -0.33404541015625, -0.31673431396484375, -0.2994232177734375, -0.28211212158203125, -0.264801025390625, -0.24748992919921875, -0.2301788330078125, -0.21286773681640625, -0.195556640625, -0.17824554443359375, -0.1609344482421875, -0.14362335205078125, -0.126312255859375, -0.10900115966796875, -0.0916900634765625, -0.07437896728515625, -0.05706787109375, -0.03975677490234375, -0.0224456787109375, -0.00513458251953125, 0.012176513671875, 0.02948760986328125, 0.0467987060546875, 0.06410980224609375, 0.0814208984375, 0.09873199462890625, 0.1160430908203125, 0.13335418701171875, 0.150665283203125, 0.16797637939453125, 0.1852874755859375, 0.20259857177734375, 0.21990966796875, 0.23722076416015625, 0.2545318603515625, 0.27184295654296875, 0.289154052734375, 0.30646514892578125, 0.3237762451171875, 0.34108734130859375, 0.3583984375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 5.0, 4.0, 5.0, 6.0, 17.0, 10.0, 23.0, 36.0, 37.0, 69.0, 88.0, 150.0, 310.0, 554.0, 1021.0, 2145.0, 4729.0, 11657.0, 36460.0, 3933214.0, 159742.0, 27129.0, 9175.0, 3925.0, 1732.0, 900.0, 478.0, 252.0, 138.0, 84.0, 49.0, 39.0, 31.0, 17.0, 15.0, 15.0, 14.0, 6.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.103515625, -2.01904296875, -1.9345703125, -1.85009765625, -1.765625, -1.68115234375, -1.5966796875, -1.51220703125, -1.427734375, -1.34326171875, -1.2587890625, -1.17431640625, -1.08984375, -1.00537109375, -0.9208984375, -0.83642578125, -0.751953125, -0.66748046875, -0.5830078125, -0.49853515625, -0.4140625, -0.32958984375, -0.2451171875, -0.16064453125, -0.076171875, 0.00830078125, 0.0927734375, 0.17724609375, 0.26171875, 0.34619140625, 0.4306640625, 0.51513671875, 0.599609375, 0.68408203125, 0.7685546875, 0.85302734375, 0.9375, 1.02197265625, 1.1064453125, 1.19091796875, 1.275390625, 1.35986328125, 1.4443359375, 1.52880859375, 1.61328125, 1.69775390625, 1.7822265625, 1.86669921875, 1.951171875, 2.03564453125, 2.1201171875, 2.20458984375, 2.2890625, 2.37353515625, 2.4580078125, 2.54248046875, 2.626953125, 2.71142578125, 2.7958984375, 2.88037109375, 2.96484375, 3.04931640625, 3.1337890625, 3.21826171875, 3.302734375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 7.0, 3.0, 2.0, 5.0, 5.0, 3.0, 9.0, 14.0, 12.0, 12.0, 19.0, 21.0, 20.0, 26.0, 35.0, 27.0, 32.0, 3558.0, 68.0, 36.0, 30.0, 22.0, 17.0, 17.0, 12.0, 15.0, 9.0, 12.0, 7.0, 7.0, 8.0, 4.0, 0.0, 7.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.438720703125, -0.4274101257324219, -0.41609954833984375, -0.4047889709472656, -0.3934783935546875, -0.3821678161621094, -0.37085723876953125, -0.3595466613769531, -0.348236083984375, -0.3369255065917969, -0.32561492919921875, -0.3143043518066406, -0.3029937744140625, -0.2916831970214844, -0.28037261962890625, -0.2690620422363281, -0.25775146484375, -0.24644088745117188, -0.23513031005859375, -0.22381973266601562, -0.2125091552734375, -0.20119857788085938, -0.18988800048828125, -0.17857742309570312, -0.167266845703125, -0.15595626831054688, -0.14464569091796875, -0.13333511352539062, -0.1220245361328125, -0.11071395874023438, -0.09940338134765625, -0.08809280395507812, -0.0767822265625, -0.06547164916992188, -0.05416107177734375, -0.042850494384765625, -0.0315399169921875, -0.020229339599609375, -0.00891876220703125, 0.002391815185546875, 0.013702392578125, 0.025012969970703125, 0.03632354736328125, 0.047634124755859375, 0.0589447021484375, 0.07025527954101562, 0.08156585693359375, 0.09287643432617188, 0.10418701171875, 0.11549758911132812, 0.12680816650390625, 0.13811874389648438, 0.1494293212890625, 0.16073989868164062, 0.17205047607421875, 0.18336105346679688, 0.194671630859375, 0.20598220825195312, 0.21729278564453125, 0.22860336303710938, 0.2399139404296875, 0.2512245178222656, 0.26253509521484375, 0.2738456726074219, 0.28515625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 957.0, 42.0, 8.0, 2.0, 0.0, 1.0], "bins": [-30.43301010131836, -29.91424560546875, -29.39548110961914, -28.87671661376953, -28.357952117919922, -27.839187622070312, -27.320423126220703, -26.801658630371094, -26.282894134521484, -25.764129638671875, -25.245365142822266, -24.726600646972656, -24.207836151123047, -23.689071655273438, -23.170307159423828, -22.65154266357422, -22.132776260375977, -21.614011764526367, -21.095247268676758, -20.57648277282715, -20.05771827697754, -19.53895378112793, -19.02018928527832, -18.501422882080078, -17.98265838623047, -17.46389389038086, -16.94512939453125, -16.42636489868164, -15.907600402832031, -15.388835906982422, -14.870070457458496, -14.351305961608887, -13.832544326782227, -13.313779830932617, -12.795015335083008, -12.276250839233398, -11.757486343383789, -11.23872184753418, -10.719956398010254, -10.201191902160645, -9.682427406311035, -9.163662910461426, -8.644898414611816, -8.126133918762207, -7.6073689460754395, -7.08860445022583, -6.5698394775390625, -6.051074981689453, -5.532310485839844, -5.013545989990234, -4.494781494140625, -3.9760165214538574, -3.457252025604248, -2.9384875297546387, -2.41972279548645, -1.9009580612182617, -1.3821935653686523, -0.8634289503097534, -0.3446643352508545, 0.17410027980804443, 0.6928648948669434, 1.2116293907165527, 1.7303941249847412, 2.2491588592529297, 2.767923355102539]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 6.0, 6.0, 14.0, 18.0, 32.0, 45.0, 67.0, 124.0, 130.0, 135.0, 126.0, 95.0, 72.0, 48.0, 33.0, 14.0, 13.0, 3.0, 5.0, 8.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4376091957092285, -1.3694449663162231, -1.3012807369232178, -1.233116626739502, -1.1649523973464966, -1.0967881679534912, -1.0286240577697754, -0.96045982837677, -0.8922955989837646, -0.8241313695907593, -0.7559671998023987, -0.6878030300140381, -0.6196388006210327, -0.5514745712280273, -0.48331040143966675, -0.41514620184898376, -0.3469820022583008, -0.2788178026676178, -0.21065360307693481, -0.14248940348625183, -0.07432520389556885, -0.006161004304885864, 0.06200319528579712, 0.1301673948764801, 0.19833159446716309, 0.26649579405784607, 0.33465999364852905, 0.40282419323921204, 0.470988392829895, 0.5391526222229004, 0.607316792011261, 0.6754809617996216, 0.743645191192627, 0.8118094205856323, 0.8799735903739929, 0.9481377601623535, 1.0163019895553589, 1.0844662189483643, 1.15263032913208, 1.2207945585250854, 1.2889587879180908, 1.3571230173110962, 1.4252872467041016, 1.4934513568878174, 1.5616155862808228, 1.6297798156738281, 1.697943925857544, 1.7661081552505493, 1.8342723846435547, 1.90243661403656, 1.9706008434295654, 2.0387649536132812, 2.106929302215576, 2.175093412399292, 2.243257522583008, 2.3114218711853027, 2.3795859813690186, 2.4477500915527344, 2.5159144401550293, 2.584078550338745, 2.652242660522461, 2.720407009124756, 2.7885711193084717, 2.8567354679107666, 2.9248995780944824]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 8.0, 5.0, 7.0, 9.0, 11.0, 20.0, 27.0, 20.0, 23.0, 53.0, 67.0, 96.0, 164.0, 283.0, 461.0, 977.0, 2843.0, 13242.0, 995276.0, 27853.0, 4273.0, 1341.0, 582.0, 313.0, 193.0, 150.0, 62.0, 53.0, 38.0, 20.0, 24.0, 17.0, 12.0, 17.0, 5.0, 3.0, 9.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.0625, -4.9205322265625, -4.778564453125, -4.6365966796875, -4.49462890625, -4.3526611328125, -4.210693359375, -4.0687255859375, -3.9267578125, -3.7847900390625, -3.642822265625, -3.5008544921875, -3.35888671875, -3.2169189453125, -3.074951171875, -2.9329833984375, -2.791015625, -2.6490478515625, -2.507080078125, -2.3651123046875, -2.22314453125, -2.0811767578125, -1.939208984375, -1.7972412109375, -1.6552734375, -1.5133056640625, -1.371337890625, -1.2293701171875, -1.08740234375, -0.9454345703125, -0.803466796875, -0.6614990234375, -0.51953125, -0.3775634765625, -0.235595703125, -0.0936279296875, 0.04833984375, 0.1903076171875, 0.332275390625, 0.4742431640625, 0.6162109375, 0.7581787109375, 0.900146484375, 1.0421142578125, 1.18408203125, 1.3260498046875, 1.468017578125, 1.6099853515625, 1.751953125, 1.8939208984375, 2.035888671875, 2.1778564453125, 2.31982421875, 2.4617919921875, 2.603759765625, 2.7457275390625, 2.8876953125, 3.0296630859375, 3.171630859375, 3.3135986328125, 3.45556640625, 3.5975341796875, 3.739501953125, 3.8814697265625, 4.0234375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 8.0, 19.0, 35.0, 491.0, 382.0, 19.0, 17.0, 11.0, 7.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73486328125, -0.7177467346191406, -0.7006301879882812, -0.6835136413574219, -0.6663970947265625, -0.6492805480957031, -0.6321640014648438, -0.6150474548339844, -0.597930908203125, -0.5808143615722656, -0.5636978149414062, -0.5465812683105469, -0.5294647216796875, -0.5123481750488281, -0.49523162841796875, -0.4781150817871094, -0.46099853515625, -0.4438819885253906, -0.42676544189453125, -0.4096488952636719, -0.3925323486328125, -0.3754158020019531, -0.35829925537109375, -0.3411827087402344, -0.324066162109375, -0.3069496154785156, -0.28983306884765625, -0.2727165222167969, -0.2555999755859375, -0.23848342895507812, -0.22136688232421875, -0.20425033569335938, -0.1871337890625, -0.17001724243164062, -0.15290069580078125, -0.13578414916992188, -0.1186676025390625, -0.10155105590820312, -0.08443450927734375, -0.06731796264648438, -0.050201416015625, -0.033084869384765625, -0.01596832275390625, 0.001148223876953125, 0.0182647705078125, 0.035381317138671875, 0.05249786376953125, 0.06961441040039062, 0.08673095703125, 0.10384750366210938, 0.12096405029296875, 0.13808059692382812, 0.1551971435546875, 0.17231369018554688, 0.18943023681640625, 0.20654678344726562, 0.223663330078125, 0.24077987670898438, 0.25789642333984375, 0.2750129699707031, 0.2921295166015625, 0.3092460632324219, 0.32636260986328125, 0.3434791564941406, 0.360595703125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 6.0, 8.0, 3.0, 13.0, 14.0, 15.0, 30.0, 33.0, 44.0, 78.0, 114.0, 218.0, 433.0, 1162.0, 4514.0, 28276.0, 736721.0, 254946.0, 17060.0, 3081.0, 911.0, 370.0, 177.0, 103.0, 68.0, 39.0, 30.0, 26.0, 20.0, 11.0, 9.0, 6.0, 7.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6123046875, -1.5523223876953125, -1.492340087890625, -1.4323577880859375, -1.37237548828125, -1.3123931884765625, -1.252410888671875, -1.1924285888671875, -1.1324462890625, -1.0724639892578125, -1.012481689453125, -0.9524993896484375, -0.89251708984375, -0.8325347900390625, -0.772552490234375, -0.7125701904296875, -0.652587890625, -0.5926055908203125, -0.532623291015625, -0.4726409912109375, -0.41265869140625, -0.3526763916015625, -0.292694091796875, -0.2327117919921875, -0.1727294921875, -0.1127471923828125, -0.052764892578125, 0.0072174072265625, 0.06719970703125, 0.1271820068359375, 0.187164306640625, 0.2471466064453125, 0.30712890625, 0.3671112060546875, 0.427093505859375, 0.4870758056640625, 0.54705810546875, 0.6070404052734375, 0.667022705078125, 0.7270050048828125, 0.7869873046875, 0.8469696044921875, 0.906951904296875, 0.9669342041015625, 1.02691650390625, 1.0868988037109375, 1.146881103515625, 1.2068634033203125, 1.266845703125, 1.3268280029296875, 1.386810302734375, 1.4467926025390625, 1.50677490234375, 1.5667572021484375, 1.626739501953125, 1.6867218017578125, 1.7467041015625, 1.8066864013671875, 1.866668701171875, 1.9266510009765625, 1.98663330078125, 2.0466156005859375, 2.106597900390625, 2.1665802001953125, 2.2265625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 7.0, 7.0, 9.0, 10.0, 17.0, 22.0, 19.0, 27.0, 41.0, 43.0, 35.0, 51.0, 48.0, 59.0, 50.0, 50.0, 56.0, 65.0, 50.0, 48.0, 37.0, 41.0, 36.0, 37.0, 26.0, 29.0, 22.0, 15.0, 12.0, 13.0, 3.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.67626953125, -0.6580314636230469, -0.6397933959960938, -0.6215553283691406, -0.6033172607421875, -0.5850791931152344, -0.5668411254882812, -0.5486030578613281, -0.530364990234375, -0.5121269226074219, -0.49388885498046875, -0.4756507873535156, -0.4574127197265625, -0.4391746520996094, -0.42093658447265625, -0.4026985168457031, -0.38446044921875, -0.3662223815917969, -0.34798431396484375, -0.3297462463378906, -0.3115081787109375, -0.2932701110839844, -0.27503204345703125, -0.2567939758300781, -0.238555908203125, -0.22031784057617188, -0.20207977294921875, -0.18384170532226562, -0.1656036376953125, -0.14736557006835938, -0.12912750244140625, -0.11088943481445312, -0.0926513671875, -0.07441329956054688, -0.05617523193359375, -0.037937164306640625, -0.0196990966796875, -0.001461029052734375, 0.01677703857421875, 0.035015106201171875, 0.053253173828125, 0.07149124145507812, 0.08972930908203125, 0.10796737670898438, 0.1262054443359375, 0.14444351196289062, 0.16268157958984375, 0.18091964721679688, 0.19915771484375, 0.21739578247070312, 0.23563385009765625, 0.2538719177246094, 0.2721099853515625, 0.2903480529785156, 0.30858612060546875, 0.3268241882324219, 0.345062255859375, 0.3633003234863281, 0.38153839111328125, 0.3997764587402344, 0.4180145263671875, 0.4362525939941406, 0.45449066162109375, 0.4727287292480469, 0.490966796875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 7.0, 8.0, 12.0, 27.0, 32.0, 41.0, 85.0, 146.0, 336.0, 1108.0, 5489.0, 65537.0, 930444.0, 39715.0, 4029.0, 946.0, 281.0, 104.0, 79.0, 53.0, 20.0, 16.0, 20.0, 9.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09503173828125, -0.0924224853515625, -0.089813232421875, -0.0872039794921875, -0.0845947265625, -0.0819854736328125, -0.079376220703125, -0.0767669677734375, -0.07415771484375, -0.0715484619140625, -0.068939208984375, -0.0663299560546875, -0.063720703125, -0.0611114501953125, -0.058502197265625, -0.0558929443359375, -0.05328369140625, -0.0506744384765625, -0.048065185546875, -0.0454559326171875, -0.0428466796875, -0.0402374267578125, -0.037628173828125, -0.0350189208984375, -0.03240966796875, -0.0298004150390625, -0.027191162109375, -0.0245819091796875, -0.02197265625, -0.0193634033203125, -0.016754150390625, -0.0141448974609375, -0.01153564453125, -0.0089263916015625, -0.006317138671875, -0.0037078857421875, -0.0010986328125, 0.0015106201171875, 0.004119873046875, 0.0067291259765625, 0.00933837890625, 0.0119476318359375, 0.014556884765625, 0.0171661376953125, 0.019775390625, 0.0223846435546875, 0.024993896484375, 0.0276031494140625, 0.03021240234375, 0.0328216552734375, 0.035430908203125, 0.0380401611328125, 0.0406494140625, 0.0432586669921875, 0.045867919921875, 0.0484771728515625, 0.05108642578125, 0.0536956787109375, 0.056304931640625, 0.0589141845703125, 0.0615234375, 0.0641326904296875, 0.066741943359375, 0.0693511962890625, 0.07196044921875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 6.0, 0.0, 9.0, 8.0, 14.0, 23.0, 32.0, 26.0, 43.0, 76.0, 108.0, 82.0, 145.0, 113.0, 76.0, 73.0, 60.0, 37.0, 21.0, 14.0, 10.0, 10.0, 10.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.033348083496094e-06, -6.810761988162994e-06, -6.588175892829895e-06, -6.365589797496796e-06, -6.143003702163696e-06, -5.920417606830597e-06, -5.6978315114974976e-06, -5.475245416164398e-06, -5.252659320831299e-06, -5.0300732254981995e-06, -4.8074871301651e-06, -4.584901034832001e-06, -4.362314939498901e-06, -4.139728844165802e-06, -3.917142748832703e-06, -3.6945566534996033e-06, -3.471970558166504e-06, -3.2493844628334045e-06, -3.026798367500305e-06, -2.804212272167206e-06, -2.5816261768341064e-06, -2.359040081501007e-06, -2.1364539861679077e-06, -1.9138678908348083e-06, -1.691281795501709e-06, -1.4686957001686096e-06, -1.2461096048355103e-06, -1.0235235095024109e-06, -8.009374141693115e-07, -5.783513188362122e-07, -3.557652235031128e-07, -1.3317912817001343e-07, 8.940696716308594e-08, 3.119930624961853e-07, 5.345791578292847e-07, 7.57165253162384e-07, 9.797513484954834e-07, 1.2023374438285828e-06, 1.4249235391616821e-06, 1.6475096344947815e-06, 1.8700957298278809e-06, 2.0926818251609802e-06, 2.3152679204940796e-06, 2.537854015827179e-06, 2.7604401111602783e-06, 2.9830262064933777e-06, 3.205612301826477e-06, 3.4281983971595764e-06, 3.6507844924926758e-06, 3.873370587825775e-06, 4.0959566831588745e-06, 4.318542778491974e-06, 4.541128873825073e-06, 4.763714969158173e-06, 4.986301064491272e-06, 5.208887159824371e-06, 5.431473255157471e-06, 5.65405935049057e-06, 5.8766454458236694e-06, 6.099231541156769e-06, 6.321817636489868e-06, 6.5444037318229675e-06, 6.766989827156067e-06, 6.989575922489166e-06, 7.212162017822266e-06]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 2.0, 2.0, 8.0, 5.0, 9.0, 10.0, 18.0, 15.0, 45.0, 57.0, 88.0, 228.0, 541.0, 1417.0, 5807.0, 60901.0, 945925.0, 27403.0, 4069.0, 1146.0, 413.0, 193.0, 80.0, 55.0, 44.0, 20.0, 17.0, 7.0, 9.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08856201171875, -0.0857391357421875, -0.082916259765625, -0.0800933837890625, -0.0772705078125, -0.0744476318359375, -0.071624755859375, -0.0688018798828125, -0.06597900390625, -0.0631561279296875, -0.060333251953125, -0.0575103759765625, -0.0546875, -0.0518646240234375, -0.049041748046875, -0.0462188720703125, -0.04339599609375, -0.0405731201171875, -0.037750244140625, -0.0349273681640625, -0.0321044921875, -0.0292816162109375, -0.026458740234375, -0.0236358642578125, -0.02081298828125, -0.0179901123046875, -0.015167236328125, -0.0123443603515625, -0.009521484375, -0.0066986083984375, -0.003875732421875, -0.0010528564453125, 0.00177001953125, 0.0045928955078125, 0.007415771484375, 0.0102386474609375, 0.0130615234375, 0.0158843994140625, 0.018707275390625, 0.0215301513671875, 0.02435302734375, 0.0271759033203125, 0.029998779296875, 0.0328216552734375, 0.03564453125, 0.0384674072265625, 0.041290283203125, 0.0441131591796875, 0.04693603515625, 0.0497589111328125, 0.052581787109375, 0.0554046630859375, 0.0582275390625, 0.0610504150390625, 0.063873291015625, 0.0666961669921875, 0.06951904296875, 0.0723419189453125, 0.075164794921875, 0.0779876708984375, 0.080810546875, 0.0836334228515625, 0.086456298828125, 0.0892791748046875, 0.09210205078125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 4.0, 8.0, 7.0, 12.0, 15.0, 10.0, 25.0, 37.0, 50.0, 75.0, 87.0, 138.0, 119.0, 124.0, 82.0, 56.0, 38.0, 28.0, 14.0, 16.0, 7.0, 11.0, 5.0, 7.0, 6.0, 4.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0290069580078125, -0.028110027313232422, -0.027213096618652344, -0.026316165924072266, -0.025419235229492188, -0.02452230453491211, -0.02362537384033203, -0.022728443145751953, -0.021831512451171875, -0.020934581756591797, -0.02003765106201172, -0.01914072036743164, -0.018243789672851562, -0.017346858978271484, -0.016449928283691406, -0.015552997589111328, -0.01465606689453125, -0.013759136199951172, -0.012862205505371094, -0.011965274810791016, -0.011068344116210938, -0.01017141342163086, -0.009274482727050781, -0.008377552032470703, -0.007480621337890625, -0.006583690643310547, -0.005686759948730469, -0.004789829254150391, -0.0038928985595703125, -0.0029959678649902344, -0.0020990371704101562, -0.0012021064758300781, -0.00030517578125, 0.0005917549133300781, 0.0014886856079101562, 0.0023856163024902344, 0.0032825469970703125, 0.004179477691650391, 0.005076408386230469, 0.005973339080810547, 0.006870269775390625, 0.007767200469970703, 0.008664131164550781, 0.00956106185913086, 0.010457992553710938, 0.011354923248291016, 0.012251853942871094, 0.013148784637451172, 0.01404571533203125, 0.014942646026611328, 0.015839576721191406, 0.016736507415771484, 0.017633438110351562, 0.01853036880493164, 0.01942729949951172, 0.020324230194091797, 0.021221160888671875, 0.022118091583251953, 0.02301502227783203, 0.02391195297241211, 0.024808883666992188, 0.025705814361572266, 0.026602745056152344, 0.027499675750732422, 0.0283966064453125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 14.0, 160.0, 792.0, 34.0, 8.0, 2.0, 6.0], "bins": [-47.23650360107422, -46.43891906738281, -45.64133071899414, -44.843746185302734, -44.04615783691406, -43.248573303222656, -42.450984954833984, -41.65340042114258, -40.855812072753906, -40.0582275390625, -39.26063919067383, -38.46305465698242, -37.66546630859375, -36.867881774902344, -36.07029342651367, -35.272708892822266, -34.47512435913086, -33.67753982543945, -32.87995147705078, -32.082366943359375, -31.284778594970703, -30.487194061279297, -29.689607620239258, -28.89202117919922, -28.09443473815918, -27.29684829711914, -26.4992618560791, -25.701675415039062, -24.904090881347656, -24.106504440307617, -23.308917999267578, -22.51133155822754, -21.7137451171875, -20.91615867614746, -20.118572235107422, -19.320985794067383, -18.523399353027344, -17.725814819335938, -16.9282283782959, -16.13064193725586, -15.33305549621582, -14.535469055175781, -13.737882614135742, -12.94029712677002, -12.14271068572998, -11.345124244689941, -10.547538757324219, -9.74995231628418, -8.95236587524414, -8.154779434204102, -7.357193470001221, -6.55960750579834, -5.762021064758301, -4.964434623718262, -4.166848659515381, -3.3692626953125, -2.571676015853882, -1.7740898132324219, -0.9765036106109619, -0.17891740798950195, 0.618668794631958, 1.416254997253418, 2.213841199874878, 3.011427164077759, 3.809013605117798]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 6.0, 4.0, 12.0, 16.0, 25.0, 23.0, 37.0, 50.0, 61.0, 77.0, 74.0, 94.0, 86.0, 87.0, 84.0, 54.0, 51.0, 41.0, 34.0, 20.0, 22.0, 11.0, 10.0, 4.0, 4.0, 4.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.451914310455322, -5.28645133972168, -5.120988845825195, -4.955526351928711, -4.790063381195068, -4.624600410461426, -4.459137916564941, -4.293675422668457, -4.1282124519348145, -3.962749719619751, -3.7972869873046875, -3.631824254989624, -3.4663615226745605, -3.300898790359497, -3.1354360580444336, -2.96997332572937, -2.8045105934143066, -2.639047861099243, -2.4735851287841797, -2.308122396469116, -2.1426596641540527, -1.9771969318389893, -1.8117341995239258, -1.6462714672088623, -1.4808087348937988, -1.3153460025787354, -1.1498832702636719, -0.9844205379486084, -0.8189578056335449, -0.6534950733184814, -0.48803234100341797, -0.3225696086883545, -0.1571063995361328, 0.008356332778930664, 0.17381906509399414, 0.3392817974090576, 0.5047445297241211, 0.6702072620391846, 0.835669994354248, 1.0011327266693115, 1.166595458984375, 1.3320581912994385, 1.497520923614502, 1.6629836559295654, 1.828446388244629, 1.9939091205596924, 2.159371852874756, 2.3248345851898193, 2.490297317504883, 2.6557600498199463, 2.8212227821350098, 2.9866855144500732, 3.1521482467651367, 3.3176109790802, 3.4830737113952637, 3.648536443710327, 3.8139991760253906, 3.979461908340454, 4.144924640655518, 4.31038761138916, 4.4758501052856445, 4.641312599182129, 4.8067755699157715, 4.972238540649414, 5.137701034545898]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 16.0, 51.0, 57.0, 98.0, 248.0, 505.0, 3050.0, 4179897.0, 9364.0, 776.0, 172.0, 31.0, 9.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.28125, -35.4306640625, -34.580078125, -33.7294921875, -32.87890625, -32.0283203125, -31.177734375, -30.3271484375, -29.4765625, -28.6259765625, -27.775390625, -26.9248046875, -26.07421875, -25.2236328125, -24.373046875, -23.5224609375, -22.671875, -21.8212890625, -20.970703125, -20.1201171875, -19.26953125, -18.4189453125, -17.568359375, -16.7177734375, -15.8671875, -15.0166015625, -14.166015625, -13.3154296875, -12.46484375, -11.6142578125, -10.763671875, -9.9130859375, -9.0625, -8.2119140625, -7.361328125, -6.5107421875, -5.66015625, -4.8095703125, -3.958984375, -3.1083984375, -2.2578125, -1.4072265625, -0.556640625, 0.2939453125, 1.14453125, 1.9951171875, 2.845703125, 3.6962890625, 4.546875, 5.3974609375, 6.248046875, 7.0986328125, 7.94921875, 8.7998046875, 9.650390625, 10.5009765625, 11.3515625, 12.2021484375, 13.052734375, 13.9033203125, 14.75390625, 15.6044921875, 16.455078125, 17.3056640625, 18.15625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 2.0, 8.0, 7.0, 21.0, 52.0, 745.0, 108.0, 31.0, 13.0, 6.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72314453125, -0.7061920166015625, -0.689239501953125, -0.6722869873046875, -0.65533447265625, -0.6383819580078125, -0.621429443359375, -0.6044769287109375, -0.5875244140625, -0.5705718994140625, -0.553619384765625, -0.5366668701171875, -0.51971435546875, -0.5027618408203125, -0.485809326171875, -0.4688568115234375, -0.451904296875, -0.4349517822265625, -0.417999267578125, -0.4010467529296875, -0.38409423828125, -0.3671417236328125, -0.350189208984375, -0.3332366943359375, -0.3162841796875, -0.2993316650390625, -0.282379150390625, -0.2654266357421875, -0.24847412109375, -0.2315216064453125, -0.214569091796875, -0.1976165771484375, -0.1806640625, -0.1637115478515625, -0.146759033203125, -0.1298065185546875, -0.11285400390625, -0.0959014892578125, -0.078948974609375, -0.0619964599609375, -0.0450439453125, -0.0280914306640625, -0.011138916015625, 0.0058135986328125, 0.02276611328125, 0.0397186279296875, 0.056671142578125, 0.0736236572265625, 0.090576171875, 0.1075286865234375, 0.124481201171875, 0.1414337158203125, 0.15838623046875, 0.1753387451171875, 0.192291259765625, 0.2092437744140625, 0.2261962890625, 0.2431488037109375, 0.260101318359375, 0.2770538330078125, 0.29400634765625, 0.3109588623046875, 0.327911376953125, 0.3448638916015625, 0.36181640625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 8.0, 4.0, 9.0, 12.0, 14.0, 15.0, 15.0, 27.0, 36.0, 52.0, 75.0, 145.0, 413.0, 1898.0, 17462.0, 4020071.0, 145773.0, 6373.0, 1075.0, 299.0, 146.0, 71.0, 58.0, 47.0, 39.0, 31.0, 27.0, 13.0, 19.0, 12.0, 10.0, 7.0, 5.0, 4.0, 7.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.26171875, -4.11383056640625, -3.9659423828125, -3.81805419921875, -3.670166015625, -3.52227783203125, -3.3743896484375, -3.22650146484375, -3.07861328125, -2.93072509765625, -2.7828369140625, -2.63494873046875, -2.487060546875, -2.33917236328125, -2.1912841796875, -2.04339599609375, -1.8955078125, -1.74761962890625, -1.5997314453125, -1.45184326171875, -1.303955078125, -1.15606689453125, -1.0081787109375, -0.86029052734375, -0.71240234375, -0.56451416015625, -0.4166259765625, -0.26873779296875, -0.120849609375, 0.02703857421875, 0.1749267578125, 0.32281494140625, 0.470703125, 0.61859130859375, 0.7664794921875, 0.91436767578125, 1.062255859375, 1.21014404296875, 1.3580322265625, 1.50592041015625, 1.65380859375, 1.80169677734375, 1.9495849609375, 2.09747314453125, 2.245361328125, 2.39324951171875, 2.5411376953125, 2.68902587890625, 2.8369140625, 2.98480224609375, 3.1326904296875, 3.28057861328125, 3.428466796875, 3.57635498046875, 3.7242431640625, 3.87213134765625, 4.02001953125, 4.16790771484375, 4.3157958984375, 4.46368408203125, 4.611572265625, 4.75946044921875, 4.9073486328125, 5.05523681640625, 5.203125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 7.0, 3.0, 10.0, 9.0, 13.0, 19.0, 11.0, 23.0, 18.0, 31.0, 27.0, 29.0, 42.0, 50.0, 58.0, 91.0, 180.0, 2791.0, 247.0, 100.0, 69.0, 44.0, 42.0, 31.0, 30.0, 18.0, 11.0, 13.0, 12.0, 10.0, 8.0, 5.0, 2.0, 6.0, 4.0, 1.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.389892578125, -0.3789520263671875, -0.368011474609375, -0.3570709228515625, -0.34613037109375, -0.3351898193359375, -0.324249267578125, -0.3133087158203125, -0.3023681640625, -0.2914276123046875, -0.280487060546875, -0.2695465087890625, -0.25860595703125, -0.2476654052734375, -0.236724853515625, -0.2257843017578125, -0.21484375, -0.2039031982421875, -0.192962646484375, -0.1820220947265625, -0.17108154296875, -0.1601409912109375, -0.149200439453125, -0.1382598876953125, -0.1273193359375, -0.1163787841796875, -0.105438232421875, -0.0944976806640625, -0.08355712890625, -0.0726165771484375, -0.061676025390625, -0.0507354736328125, -0.039794921875, -0.0288543701171875, -0.017913818359375, -0.0069732666015625, 0.00396728515625, 0.0149078369140625, 0.025848388671875, 0.0367889404296875, 0.0477294921875, 0.0586700439453125, 0.069610595703125, 0.0805511474609375, 0.09149169921875, 0.1024322509765625, 0.113372802734375, 0.1243133544921875, 0.13525390625, 0.1461944580078125, 0.157135009765625, 0.1680755615234375, 0.17901611328125, 0.1899566650390625, 0.200897216796875, 0.2118377685546875, 0.2227783203125, 0.2337188720703125, 0.244659423828125, 0.2555999755859375, 0.26654052734375, 0.2774810791015625, 0.288421630859375, 0.2993621826171875, 0.310302734375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 10.0, 38.0, 685.0, 239.0, 26.0, 5.0, 3.0, 1.0, 1.0], "bins": [-11.203322410583496, -11.009543418884277, -10.815765380859375, -10.621986389160156, -10.428207397460938, -10.234429359436035, -10.040650367736816, -9.846872329711914, -9.653093338012695, -9.459314346313477, -9.265536308288574, -9.071757316589355, -8.877979278564453, -8.684200286865234, -8.490421295166016, -8.296643257141113, -8.102864265441895, -7.909085750579834, -7.715307235717773, -7.521528244018555, -7.327749729156494, -7.133971214294434, -6.940192222595215, -6.746413707733154, -6.552635192871094, -6.358856678009033, -6.165078163146973, -5.971299171447754, -5.777520656585693, -5.583742141723633, -5.389963150024414, -5.1961846351623535, -5.002406120300293, -4.808627605438232, -4.614849090576172, -4.421070098876953, -4.227291584014893, -4.033513069152832, -3.8397343158721924, -3.6459555625915527, -3.452176809310913, -3.2583980560302734, -3.064619541168213, -2.8708410263061523, -2.6770622730255127, -2.483283519744873, -2.2895050048828125, -2.095726490020752, -1.9019477367401123, -1.7081691026687622, -1.514390468597412, -1.320611834526062, -1.126833200454712, -0.9330545663833618, -0.7392759323120117, -0.5454972982406616, -0.3517186641693115, -0.15794003009796143, 0.03583860397338867, 0.22961723804473877, 0.42339587211608887, 0.617174506187439, 0.8109531402587891, 1.0047317743301392, 1.1985104084014893]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 13.0, 20.0, 17.0, 39.0, 59.0, 90.0, 105.0, 115.0, 108.0, 124.0, 103.0, 70.0, 57.0, 37.0, 18.0, 13.0, 7.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.40962553024292, -2.3139803409576416, -2.2183351516723633, -2.122690200805664, -2.0270450115203857, -1.9313998222351074, -1.835754632949829, -1.7401094436645508, -1.6444642543792725, -1.5488190650939941, -1.4531739950180054, -1.357528805732727, -1.2618836164474487, -1.16623854637146, -1.0705933570861816, -0.9749481678009033, -0.8793030977249146, -0.783657968044281, -0.6880127787590027, -0.5923676490783691, -0.4967224895954132, -0.4010773301124573, -0.30543220043182373, -0.2097870111465454, -0.11414188146591187, -0.01849672943353653, 0.0771484225988388, 0.17279356718063354, 0.2684387266635895, 0.3640838861465454, 0.45972901582717896, 0.5553742051124573, 0.6510193347930908, 0.7466644644737244, 0.8423096537590027, 0.9379547834396362, 1.0335999727249146, 1.1292450428009033, 1.2248902320861816, 1.32053542137146, 1.4161806106567383, 1.5118257999420166, 1.6074708700180054, 1.7031160593032837, 1.798761248588562, 1.8944063186645508, 1.990051507949829, 2.0856966972351074, 2.1813416481018066, 2.276986837387085, 2.3726320266723633, 2.4682769775390625, 2.563922166824341, 2.659567356109619, 2.7552125453948975, 2.850857734680176, 2.946502923965454, 3.0421481132507324, 3.1377933025360107, 3.233438491821289, 3.3290834426879883, 3.4247286319732666, 3.520373821258545, 3.6160190105438232, 3.7116641998291016]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 7.0, 6.0, 4.0, 7.0, 3.0, 7.0, 12.0, 18.0, 15.0, 14.0, 30.0, 52.0, 67.0, 76.0, 123.0, 206.0, 374.0, 613.0, 1310.0, 3806.0, 27881.0, 994686.0, 13800.0, 2895.0, 1092.0, 558.0, 316.0, 159.0, 144.0, 75.0, 50.0, 40.0, 25.0, 20.0, 17.0, 13.0, 10.0, 6.0, 5.0, 5.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-3.802734375, -3.692138671875, -3.58154296875, -3.470947265625, -3.3603515625, -3.249755859375, -3.13916015625, -3.028564453125, -2.91796875, -2.807373046875, -2.69677734375, -2.586181640625, -2.4755859375, -2.364990234375, -2.25439453125, -2.143798828125, -2.033203125, -1.922607421875, -1.81201171875, -1.701416015625, -1.5908203125, -1.480224609375, -1.36962890625, -1.259033203125, -1.1484375, -1.037841796875, -0.92724609375, -0.816650390625, -0.7060546875, -0.595458984375, -0.48486328125, -0.374267578125, -0.263671875, -0.153076171875, -0.04248046875, 0.068115234375, 0.1787109375, 0.289306640625, 0.39990234375, 0.510498046875, 0.62109375, 0.731689453125, 0.84228515625, 0.952880859375, 1.0634765625, 1.174072265625, 1.28466796875, 1.395263671875, 1.505859375, 1.616455078125, 1.72705078125, 1.837646484375, 1.9482421875, 2.058837890625, 2.16943359375, 2.280029296875, 2.390625, 2.501220703125, 2.61181640625, 2.722412109375, 2.8330078125, 2.943603515625, 3.05419921875, 3.164794921875, 3.275390625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 10.0, 13.0, 34.0, 332.0, 501.0, 73.0, 16.0, 7.0, 7.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67431640625, -0.6583137512207031, -0.6423110961914062, -0.6263084411621094, -0.6103057861328125, -0.5943031311035156, -0.5783004760742188, -0.5622978210449219, -0.546295166015625, -0.5302925109863281, -0.5142898559570312, -0.4982872009277344, -0.4822845458984375, -0.4662818908691406, -0.45027923583984375, -0.4342765808105469, -0.41827392578125, -0.4022712707519531, -0.38626861572265625, -0.3702659606933594, -0.3542633056640625, -0.3382606506347656, -0.32225799560546875, -0.3062553405761719, -0.290252685546875, -0.2742500305175781, -0.25824737548828125, -0.24224472045898438, -0.2262420654296875, -0.21023941040039062, -0.19423675537109375, -0.17823410034179688, -0.1622314453125, -0.14622879028320312, -0.13022613525390625, -0.11422348022460938, -0.0982208251953125, -0.08221817016601562, -0.06621551513671875, -0.050212860107421875, -0.034210205078125, -0.018207550048828125, -0.00220489501953125, 0.013797760009765625, 0.0298004150390625, 0.045803070068359375, 0.06180572509765625, 0.07780838012695312, 0.09381103515625, 0.10981369018554688, 0.12581634521484375, 0.14181900024414062, 0.1578216552734375, 0.17382431030273438, 0.18982696533203125, 0.20582962036132812, 0.221832275390625, 0.23783493041992188, 0.25383758544921875, 0.2698402404785156, 0.2858428955078125, 0.3018455505371094, 0.31784820556640625, 0.3338508605957031, 0.349853515625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 0.0, 4.0, 0.0, 6.0, 4.0, 10.0, 2.0, 7.0, 8.0, 13.0, 16.0, 17.0, 26.0, 28.0, 38.0, 47.0, 58.0, 97.0, 134.0, 228.0, 383.0, 741.0, 2018.0, 8788.0, 104758.0, 869254.0, 52860.0, 5835.0, 1493.0, 644.0, 356.0, 204.0, 138.0, 84.0, 54.0, 48.0, 32.0, 23.0, 22.0, 15.0, 10.0, 13.0, 6.0, 10.0, 6.0, 6.0, 3.0, 4.0, 1.0, 2.0, 4.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.64453125, -1.592132568359375, -1.53973388671875, -1.487335205078125, -1.4349365234375, -1.382537841796875, -1.33013916015625, -1.277740478515625, -1.225341796875, -1.172943115234375, -1.12054443359375, -1.068145751953125, -1.0157470703125, -0.963348388671875, -0.91094970703125, -0.858551025390625, -0.80615234375, -0.753753662109375, -0.70135498046875, -0.648956298828125, -0.5965576171875, -0.544158935546875, -0.49176025390625, -0.439361572265625, -0.386962890625, -0.334564208984375, -0.28216552734375, -0.229766845703125, -0.1773681640625, -0.124969482421875, -0.07257080078125, -0.020172119140625, 0.0322265625, 0.084625244140625, 0.13702392578125, 0.189422607421875, 0.2418212890625, 0.294219970703125, 0.34661865234375, 0.399017333984375, 0.451416015625, 0.503814697265625, 0.55621337890625, 0.608612060546875, 0.6610107421875, 0.713409423828125, 0.76580810546875, 0.818206787109375, 0.87060546875, 0.923004150390625, 0.97540283203125, 1.027801513671875, 1.0802001953125, 1.132598876953125, 1.18499755859375, 1.237396240234375, 1.289794921875, 1.342193603515625, 1.39459228515625, 1.446990966796875, 1.4993896484375, 1.551788330078125, 1.60418701171875, 1.656585693359375, 1.708984375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 3.0, 1.0, 2.0, 6.0, 5.0, 7.0, 8.0, 8.0, 9.0, 14.0, 10.0, 17.0, 20.0, 18.0, 27.0, 26.0, 29.0, 35.0, 32.0, 45.0, 41.0, 39.0, 41.0, 34.0, 39.0, 42.0, 48.0, 43.0, 38.0, 30.0, 34.0, 31.0, 29.0, 23.0, 25.0, 26.0, 19.0, 16.0, 14.0, 21.0, 9.0, 8.0, 5.0, 6.0, 6.0, 6.0, 4.0, 0.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.498046875, -0.4827423095703125, -0.467437744140625, -0.4521331787109375, -0.43682861328125, -0.4215240478515625, -0.406219482421875, -0.3909149169921875, -0.3756103515625, -0.3603057861328125, -0.345001220703125, -0.3296966552734375, -0.31439208984375, -0.2990875244140625, -0.283782958984375, -0.2684783935546875, -0.253173828125, -0.2378692626953125, -0.222564697265625, -0.2072601318359375, -0.19195556640625, -0.1766510009765625, -0.161346435546875, -0.1460418701171875, -0.1307373046875, -0.1154327392578125, -0.100128173828125, -0.0848236083984375, -0.06951904296875, -0.0542144775390625, -0.038909912109375, -0.0236053466796875, -0.00830078125, 0.0070037841796875, 0.022308349609375, 0.0376129150390625, 0.05291748046875, 0.0682220458984375, 0.083526611328125, 0.0988311767578125, 0.1141357421875, 0.1294403076171875, 0.144744873046875, 0.1600494384765625, 0.17535400390625, 0.1906585693359375, 0.205963134765625, 0.2212677001953125, 0.236572265625, 0.2518768310546875, 0.267181396484375, 0.2824859619140625, 0.29779052734375, 0.3130950927734375, 0.328399658203125, 0.3437042236328125, 0.3590087890625, 0.3743133544921875, 0.389617919921875, 0.4049224853515625, 0.42022705078125, 0.4355316162109375, 0.450836181640625, 0.4661407470703125, 0.4814453125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 3.0, 3.0, 7.0, 12.0, 12.0, 19.0, 33.0, 27.0, 41.0, 90.0, 118.0, 184.0, 403.0, 1054.0, 3671.0, 24909.0, 779110.0, 222613.0, 12389.0, 2286.0, 707.0, 352.0, 160.0, 109.0, 78.0, 41.0, 34.0, 18.0, 15.0, 11.0, 13.0, 7.0, 8.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28369140625, -0.2744941711425781, -0.26529693603515625, -0.2560997009277344, -0.2469024658203125, -0.23770523071289062, -0.22850799560546875, -0.21931076049804688, -0.210113525390625, -0.20091629028320312, -0.19171905517578125, -0.18252182006835938, -0.1733245849609375, -0.16412734985351562, -0.15493011474609375, -0.14573287963867188, -0.13653564453125, -0.12733840942382812, -0.11814117431640625, -0.10894393920898438, -0.0997467041015625, -0.09054946899414062, -0.08135223388671875, -0.07215499877929688, -0.062957763671875, -0.053760528564453125, -0.04456329345703125, -0.035366058349609375, -0.0261688232421875, -0.016971588134765625, -0.00777435302734375, 0.001422882080078125, 0.0106201171875, 0.019817352294921875, 0.02901458740234375, 0.038211822509765625, 0.0474090576171875, 0.056606292724609375, 0.06580352783203125, 0.07500076293945312, 0.084197998046875, 0.09339523315429688, 0.10259246826171875, 0.11178970336914062, 0.1209869384765625, 0.13018417358398438, 0.13938140869140625, 0.14857864379882812, 0.15777587890625, 0.16697311401367188, 0.17617034912109375, 0.18536758422851562, 0.1945648193359375, 0.20376205444335938, 0.21295928955078125, 0.22215652465820312, 0.231353759765625, 0.24055099487304688, 0.24974822998046875, 0.2589454650878906, 0.2681427001953125, 0.2773399353027344, 0.28653717041015625, 0.2957344055175781, 0.304931640625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 8.0, 6.0, 10.0, 15.0, 24.0, 25.0, 29.0, 54.0, 64.0, 103.0, 117.0, 115.0, 108.0, 98.0, 61.0, 32.0, 35.0, 16.0, 17.0, 13.0, 9.0, 5.0, 7.0, 5.0, 2.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4543533325195312e-05, -1.4077872037887573e-05, -1.3612210750579834e-05, -1.3146549463272095e-05, -1.2680888175964355e-05, -1.2215226888656616e-05, -1.1749565601348877e-05, -1.1283904314041138e-05, -1.0818243026733398e-05, -1.035258173942566e-05, -9.88692045211792e-06, -9.42125916481018e-06, -8.955597877502441e-06, -8.489936590194702e-06, -8.024275302886963e-06, -7.558614015579224e-06, -7.092952728271484e-06, -6.627291440963745e-06, -6.161630153656006e-06, -5.695968866348267e-06, -5.230307579040527e-06, -4.764646291732788e-06, -4.298985004425049e-06, -3.8333237171173096e-06, -3.3676624298095703e-06, -2.902001142501831e-06, -2.436339855194092e-06, -1.9706785678863525e-06, -1.5050172805786133e-06, -1.039355993270874e-06, -5.736947059631348e-07, -1.0803341865539551e-07, 3.5762786865234375e-07, 8.23289155960083e-07, 1.2889504432678223e-06, 1.7546117305755615e-06, 2.2202730178833008e-06, 2.68593430519104e-06, 3.1515955924987793e-06, 3.6172568798065186e-06, 4.082918167114258e-06, 4.548579454421997e-06, 5.014240741729736e-06, 5.479902029037476e-06, 5.945563316345215e-06, 6.411224603652954e-06, 6.876885890960693e-06, 7.342547178268433e-06, 7.808208465576172e-06, 8.273869752883911e-06, 8.73953104019165e-06, 9.20519232749939e-06, 9.670853614807129e-06, 1.0136514902114868e-05, 1.0602176189422607e-05, 1.1067837476730347e-05, 1.1533498764038086e-05, 1.1999160051345825e-05, 1.2464821338653564e-05, 1.2930482625961304e-05, 1.3396143913269043e-05, 1.3861805200576782e-05, 1.4327466487884521e-05, 1.479312777519226e-05, 1.52587890625e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 5.0, 6.0, 7.0, 8.0, 16.0, 19.0, 43.0, 64.0, 79.0, 163.0, 359.0, 991.0, 5172.0, 133943.0, 894274.0, 10755.0, 1640.0, 506.0, 194.0, 106.0, 47.0, 51.0, 33.0, 15.0, 12.0, 5.0, 8.0, 8.0, 6.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.521484375, -0.5057601928710938, -0.4900360107421875, -0.47431182861328125, -0.458587646484375, -0.44286346435546875, -0.4271392822265625, -0.41141510009765625, -0.39569091796875, -0.37996673583984375, -0.3642425537109375, -0.34851837158203125, -0.332794189453125, -0.31707000732421875, -0.3013458251953125, -0.28562164306640625, -0.2698974609375, -0.25417327880859375, -0.2384490966796875, -0.22272491455078125, -0.207000732421875, -0.19127655029296875, -0.1755523681640625, -0.15982818603515625, -0.14410400390625, -0.12837982177734375, -0.1126556396484375, -0.09693145751953125, -0.081207275390625, -0.06548309326171875, -0.0497589111328125, -0.03403472900390625, -0.018310546875, -0.00258636474609375, 0.0131378173828125, 0.02886199951171875, 0.044586181640625, 0.06031036376953125, 0.0760345458984375, 0.09175872802734375, 0.10748291015625, 0.12320709228515625, 0.1389312744140625, 0.15465545654296875, 0.170379638671875, 0.18610382080078125, 0.2018280029296875, 0.21755218505859375, 0.2332763671875, 0.24900054931640625, 0.2647247314453125, 0.28044891357421875, 0.296173095703125, 0.31189727783203125, 0.3276214599609375, 0.34334564208984375, 0.35906982421875, 0.37479400634765625, 0.3905181884765625, 0.40624237060546875, 0.421966552734375, 0.43769073486328125, 0.4534149169921875, 0.46913909912109375, 0.48486328125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 1.0, 7.0, 8.0, 3.0, 5.0, 9.0, 13.0, 17.0, 14.0, 22.0, 27.0, 40.0, 56.0, 89.0, 107.0, 107.0, 111.0, 87.0, 70.0, 58.0, 29.0, 18.0, 19.0, 23.0, 13.0, 9.0, 7.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1275634765625, -0.12325859069824219, -0.11895370483398438, -0.11464881896972656, -0.11034393310546875, -0.10603904724121094, -0.10173416137695312, -0.09742927551269531, -0.0931243896484375, -0.08881950378417969, -0.08451461791992188, -0.08020973205566406, -0.07590484619140625, -0.07159996032714844, -0.06729507446289062, -0.06299018859863281, -0.058685302734375, -0.05438041687011719, -0.050075531005859375, -0.04577064514160156, -0.04146575927734375, -0.03716087341308594, -0.032855987548828125, -0.028551101684570312, -0.0242462158203125, -0.019941329956054688, -0.015636444091796875, -0.011331558227539062, -0.00702667236328125, -0.0027217864990234375, 0.001583099365234375, 0.0058879852294921875, 0.01019287109375, 0.014497756958007812, 0.018802642822265625, 0.023107528686523438, 0.02741241455078125, 0.03171730041503906, 0.036022186279296875, 0.04032707214355469, 0.0446319580078125, 0.04893684387207031, 0.053241729736328125, 0.05754661560058594, 0.06185150146484375, 0.06615638732910156, 0.07046127319335938, 0.07476615905761719, 0.079071044921875, 0.08337593078613281, 0.08768081665039062, 0.09198570251464844, 0.09629058837890625, 0.10059547424316406, 0.10490036010742188, 0.10920524597167969, 0.1135101318359375, 0.11781501770019531, 0.12211990356445312, 0.12642478942871094, 0.13072967529296875, 0.13503456115722656, 0.13933944702148438, 0.1436443328857422, 0.14794921875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 11.0, 767.0, 237.0, 5.0], "bins": [-83.30458068847656, -81.95889282226562, -80.61321258544922, -79.26752471923828, -77.92184448242188, -76.57615661621094, -75.23047637939453, -73.8847885131836, -72.53910827636719, -71.19342041015625, -69.84774017333984, -68.5020523071289, -67.1563720703125, -65.81068420410156, -64.46500396728516, -63.11931610107422, -61.77362823486328, -60.42794418334961, -59.08226013183594, -57.736576080322266, -56.390892028808594, -55.045204162597656, -53.69952392578125, -52.35383605957031, -51.008155822753906, -49.662471771240234, -48.31678771972656, -46.97110366821289, -45.62541961669922, -44.27973175048828, -42.934051513671875, -41.58836364746094, -40.24268341064453, -38.89699935913086, -37.55131530761719, -36.205631256103516, -34.859947204589844, -33.514259338378906, -32.1685791015625, -30.822891235351562, -29.47720718383789, -28.13152313232422, -26.785839080810547, -25.440155029296875, -24.09446907043457, -22.7487850189209, -21.403100967407227, -20.057415008544922, -18.711732864379883, -17.36604881286621, -16.02036476135254, -14.67467975616455, -13.328994750976562, -11.98331069946289, -10.637626647949219, -9.29194164276123, -7.946257591247559, -6.6005730628967285, -5.254888534545898, -3.9092044830322266, -2.5635199546813965, -1.2178354263305664, 0.12784862518310547, 1.4735336303710938, 2.8192179203033447]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 13.0, 18.0, 21.0, 45.0, 53.0, 64.0, 68.0, 86.0, 77.0, 84.0, 75.0, 80.0, 77.0, 70.0, 55.0, 30.0, 26.0, 15.0, 8.0, 11.0, 7.0, 4.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.881531715393066, -8.656502723693848, -8.431473731994629, -8.20644474029541, -7.981415748596191, -7.756386756896973, -7.531358242034912, -7.306329250335693, -7.081300258636475, -6.856271266937256, -6.631242275238037, -6.406213283538818, -6.181184768676758, -5.956155776977539, -5.73112678527832, -5.506097793579102, -5.281068801879883, -5.056039810180664, -4.831010818481445, -4.605981826782227, -4.380952835083008, -4.155923843383789, -3.9308953285217285, -3.7058663368225098, -3.480837345123291, -3.2558083534240723, -3.0307793617248535, -2.805750608444214, -2.580721616744995, -2.3556926250457764, -2.1306638717651367, -1.905634880065918, -1.6806058883666992, -1.4555768966674805, -1.2305480241775513, -1.005519151687622, -0.7804901599884033, -0.5554611682891846, -0.33043229579925537, -0.10540342330932617, 0.11962556838989258, 0.34465450048446655, 0.5696834325790405, 0.7947123646736145, 1.0197412967681885, 1.2447702884674072, 1.4697991609573364, 1.6948280334472656, 1.9198570251464844, 2.144886016845703, 2.369915008544922, 2.5949437618255615, 2.8199727535247803, 3.045001745223999, 3.2700304985046387, 3.4950594902038574, 3.720088481903076, 3.945117473602295, 4.170146465301514, 4.395175457000732, 4.620203971862793, 4.845232963562012, 5.0702619552612305, 5.295290946960449, 5.520319938659668]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 13.0, 25.0, 35.0, 57.0, 153.0, 377.0, 3446.0, 4187331.0, 2425.0, 300.0, 72.0, 21.0, 11.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.375, -17.9520263671875, -17.529052734375, -17.1060791015625, -16.68310546875, -16.2601318359375, -15.837158203125, -15.4141845703125, -14.9912109375, -14.5682373046875, -14.145263671875, -13.7222900390625, -13.29931640625, -12.8763427734375, -12.453369140625, -12.0303955078125, -11.607421875, -11.1844482421875, -10.761474609375, -10.3385009765625, -9.91552734375, -9.4925537109375, -9.069580078125, -8.6466064453125, -8.2236328125, -7.8006591796875, -7.377685546875, -6.9547119140625, -6.53173828125, -6.1087646484375, -5.685791015625, -5.2628173828125, -4.83984375, -4.4168701171875, -3.993896484375, -3.5709228515625, -3.14794921875, -2.7249755859375, -2.302001953125, -1.8790283203125, -1.4560546875, -1.0330810546875, -0.610107421875, -0.1871337890625, 0.23583984375, 0.6588134765625, 1.081787109375, 1.5047607421875, 1.927734375, 2.3507080078125, 2.773681640625, 3.1966552734375, 3.61962890625, 4.0426025390625, 4.465576171875, 4.8885498046875, 5.3115234375, 5.7344970703125, 6.157470703125, 6.5804443359375, 7.00341796875, 7.4263916015625, 7.849365234375, 8.2723388671875, 8.6953125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 8.0, 15.0, 33.0, 227.0, 477.0, 176.0, 35.0, 13.0, 6.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72998046875, -0.713165283203125, -0.69635009765625, -0.679534912109375, -0.6627197265625, -0.645904541015625, -0.62908935546875, -0.612274169921875, -0.595458984375, -0.578643798828125, -0.56182861328125, -0.545013427734375, -0.5281982421875, -0.511383056640625, -0.49456787109375, -0.477752685546875, -0.4609375, -0.444122314453125, -0.42730712890625, -0.410491943359375, -0.3936767578125, -0.376861572265625, -0.36004638671875, -0.343231201171875, -0.326416015625, -0.309600830078125, -0.29278564453125, -0.275970458984375, -0.2591552734375, -0.242340087890625, -0.22552490234375, -0.208709716796875, -0.19189453125, -0.175079345703125, -0.15826416015625, -0.141448974609375, -0.1246337890625, -0.107818603515625, -0.09100341796875, -0.074188232421875, -0.057373046875, -0.040557861328125, -0.02374267578125, -0.006927490234375, 0.0098876953125, 0.026702880859375, 0.04351806640625, 0.060333251953125, 0.0771484375, 0.093963623046875, 0.11077880859375, 0.127593994140625, 0.1444091796875, 0.161224365234375, 0.17803955078125, 0.194854736328125, 0.211669921875, 0.228485107421875, 0.24530029296875, 0.262115478515625, 0.2789306640625, 0.295745849609375, 0.31256103515625, 0.329376220703125, 0.34619140625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 0.0, 4.0, 2.0, 2.0, 2.0, 5.0, 9.0, 10.0, 6.0, 20.0, 10.0, 28.0, 45.0, 58.0, 139.0, 381.0, 1294.0, 4851.0, 30343.0, 4093876.0, 53959.0, 6754.0, 1572.0, 502.0, 174.0, 76.0, 50.0, 26.0, 19.0, 21.0, 12.0, 7.0, 4.0, 4.0, 6.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.28515625, -2.2171630859375, -2.149169921875, -2.0811767578125, -2.01318359375, -1.9451904296875, -1.877197265625, -1.8092041015625, -1.7412109375, -1.6732177734375, -1.605224609375, -1.5372314453125, -1.46923828125, -1.4012451171875, -1.333251953125, -1.2652587890625, -1.197265625, -1.1292724609375, -1.061279296875, -0.9932861328125, -0.92529296875, -0.8572998046875, -0.789306640625, -0.7213134765625, -0.6533203125, -0.5853271484375, -0.517333984375, -0.4493408203125, -0.38134765625, -0.3133544921875, -0.245361328125, -0.1773681640625, -0.109375, -0.0413818359375, 0.026611328125, 0.0946044921875, 0.16259765625, 0.2305908203125, 0.298583984375, 0.3665771484375, 0.4345703125, 0.5025634765625, 0.570556640625, 0.6385498046875, 0.70654296875, 0.7745361328125, 0.842529296875, 0.9105224609375, 0.978515625, 1.0465087890625, 1.114501953125, 1.1824951171875, 1.25048828125, 1.3184814453125, 1.386474609375, 1.4544677734375, 1.5224609375, 1.5904541015625, 1.658447265625, 1.7264404296875, 1.79443359375, 1.8624267578125, 1.930419921875, 1.9984130859375, 2.06640625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 5.0, 2.0, 1.0, 4.0, 10.0, 6.0, 9.0, 7.0, 16.0, 12.0, 16.0, 30.0, 36.0, 58.0, 132.0, 2817.0, 594.0, 100.0, 62.0, 30.0, 25.0, 16.0, 12.0, 11.0, 11.0, 3.0, 8.0, 4.0, 6.0, 4.0, 5.0, 1.0, 1.0, 5.0, 1.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.299072265625, -0.2896919250488281, -0.28031158447265625, -0.2709312438964844, -0.2615509033203125, -0.2521705627441406, -0.24279022216796875, -0.23340988159179688, -0.224029541015625, -0.21464920043945312, -0.20526885986328125, -0.19588851928710938, -0.1865081787109375, -0.17712783813476562, -0.16774749755859375, -0.15836715698242188, -0.14898681640625, -0.13960647583007812, -0.13022613525390625, -0.12084579467773438, -0.1114654541015625, -0.10208511352539062, -0.09270477294921875, -0.08332443237304688, -0.073944091796875, -0.06456375122070312, -0.05518341064453125, -0.045803070068359375, -0.0364227294921875, -0.027042388916015625, -0.01766204833984375, -0.008281707763671875, 0.0010986328125, 0.010478973388671875, 0.01985931396484375, 0.029239654541015625, 0.0386199951171875, 0.048000335693359375, 0.05738067626953125, 0.06676101684570312, 0.076141357421875, 0.08552169799804688, 0.09490203857421875, 0.10428237915039062, 0.1136627197265625, 0.12304306030273438, 0.13242340087890625, 0.14180374145507812, 0.15118408203125, 0.16056442260742188, 0.16994476318359375, 0.17932510375976562, 0.1887054443359375, 0.19808578491210938, 0.20746612548828125, 0.21684646606445312, 0.226226806640625, 0.23560714721679688, 0.24498748779296875, 0.2543678283691406, 0.2637481689453125, 0.2731285095214844, 0.28250885009765625, 0.2918891906738281, 0.30126953125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [4.0, 51.0, 963.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9768232107162476, -0.5497756600379944, -0.12272810935974121, 0.30431950092315674, 0.7313669919967651, 1.1584144830703735, 1.585462212562561, 2.012509822845459, 2.4395570755004883, 2.8666045665740967, 3.293652057647705, 3.7206997871398926, 4.147747039794922, 4.574794769287109, 5.001842498779297, 5.428890228271484, 5.855937480926514, 6.282985210418701, 6.7100324630737305, 7.137080192565918, 7.5641279220581055, 7.991175174713135, 8.418222427368164, 8.845270156860352, 9.272317886352539, 9.699365615844727, 10.126413345336914, 10.553461074829102, 10.980507850646973, 11.40755558013916, 11.834603309631348, 12.261651039123535, 12.688697814941406, 13.115745544433594, 13.542793273925781, 13.969841003417969, 14.39688777923584, 14.823935508728027, 15.250983238220215, 15.678030967712402, 16.105077743530273, 16.53212547302246, 16.95917320251465, 17.386220932006836, 17.813268661499023, 18.240314483642578, 18.667362213134766, 19.094409942626953, 19.52145767211914, 19.948505401611328, 20.375553131103516, 20.802600860595703, 21.22964859008789, 21.656696319580078, 22.083744049072266, 22.51078987121582, 22.93783950805664, 23.364887237548828, 23.791934967041016, 24.218982696533203, 24.64603042602539, 25.073078155517578, 25.500125885009766, 25.92717170715332, 26.354219436645508]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 9.0, 11.0, 21.0, 54.0, 68.0, 107.0, 141.0, 123.0, 134.0, 118.0, 81.0, 47.0, 44.0, 32.0, 5.0, 2.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.183340072631836, -2.110987901687622, -2.038635730743408, -1.9662833213806152, -1.8939311504364014, -1.8215789794921875, -1.749226689338684, -1.6768743991851807, -1.6045222282409668, -1.532170057296753, -1.4598177671432495, -1.387465476989746, -1.3151133060455322, -1.2427611351013184, -1.170408844947815, -1.0980565547943115, -1.0257043838500977, -0.953352153301239, -0.8809999227523804, -0.8086476922035217, -0.7362954616546631, -0.6639432311058044, -0.5915910005569458, -0.5192387700080872, -0.4468865394592285, -0.3745343089103699, -0.30218207836151123, -0.2298298478126526, -0.15747761726379395, -0.0851253867149353, -0.01277315616607666, 0.05957907438278198, 0.13193154335021973, 0.20428377389907837, 0.276636004447937, 0.34898823499679565, 0.4213404655456543, 0.49369269609451294, 0.5660449266433716, 0.6383971571922302, 0.7107493877410889, 0.7831016182899475, 0.8554538488388062, 0.9278060793876648, 1.0001583099365234, 1.0725104808807373, 1.1448627710342407, 1.2172150611877441, 1.289567232131958, 1.3619194030761719, 1.4342716932296753, 1.5066239833831787, 1.5789761543273926, 1.6513283252716064, 1.7236806154251099, 1.7960329055786133, 1.8683850765228271, 1.940737247467041, 2.013089656829834, 2.085441827774048, 2.1577939987182617, 2.2301461696624756, 2.3024983406066895, 2.3748507499694824, 2.4472029209136963]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 3.0, 3.0, 2.0, 4.0, 8.0, 7.0, 9.0, 8.0, 16.0, 20.0, 30.0, 54.0, 45.0, 79.0, 117.0, 194.0, 353.0, 568.0, 1379.0, 3836.0, 29829.0, 989515.0, 16875.0, 3028.0, 1131.0, 565.0, 330.0, 172.0, 107.0, 86.0, 53.0, 31.0, 28.0, 20.0, 12.0, 8.0, 8.0, 4.0, 8.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.166015625, -3.071258544921875, -2.97650146484375, -2.881744384765625, -2.7869873046875, -2.692230224609375, -2.59747314453125, -2.502716064453125, -2.407958984375, -2.313201904296875, -2.21844482421875, -2.123687744140625, -2.0289306640625, -1.934173583984375, -1.83941650390625, -1.744659423828125, -1.64990234375, -1.555145263671875, -1.46038818359375, -1.365631103515625, -1.2708740234375, -1.176116943359375, -1.08135986328125, -0.986602783203125, -0.891845703125, -0.797088623046875, -0.70233154296875, -0.607574462890625, -0.5128173828125, -0.418060302734375, -0.32330322265625, -0.228546142578125, -0.1337890625, -0.039031982421875, 0.05572509765625, 0.150482177734375, 0.2452392578125, 0.339996337890625, 0.43475341796875, 0.529510498046875, 0.624267578125, 0.719024658203125, 0.81378173828125, 0.908538818359375, 1.0032958984375, 1.098052978515625, 1.19281005859375, 1.287567138671875, 1.38232421875, 1.477081298828125, 1.57183837890625, 1.666595458984375, 1.7613525390625, 1.856109619140625, 1.95086669921875, 2.045623779296875, 2.140380859375, 2.235137939453125, 2.32989501953125, 2.424652099609375, 2.5194091796875, 2.614166259765625, 2.70892333984375, 2.803680419921875, 2.8984375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 11.0, 16.0, 147.0, 447.0, 293.0, 47.0, 15.0, 9.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69189453125, -0.6756973266601562, -0.6595001220703125, -0.6433029174804688, -0.627105712890625, -0.6109085083007812, -0.5947113037109375, -0.5785140991210938, -0.56231689453125, -0.5461196899414062, -0.5299224853515625, -0.5137252807617188, -0.497528076171875, -0.48133087158203125, -0.4651336669921875, -0.44893646240234375, -0.4327392578125, -0.41654205322265625, -0.4003448486328125, -0.38414764404296875, -0.367950439453125, -0.35175323486328125, -0.3355560302734375, -0.31935882568359375, -0.30316162109375, -0.28696441650390625, -0.2707672119140625, -0.25457000732421875, -0.238372802734375, -0.22217559814453125, -0.2059783935546875, -0.18978118896484375, -0.173583984375, -0.15738677978515625, -0.1411895751953125, -0.12499237060546875, -0.108795166015625, -0.09259796142578125, -0.0764007568359375, -0.06020355224609375, -0.04400634765625, -0.02780914306640625, -0.0116119384765625, 0.00458526611328125, 0.020782470703125, 0.03697967529296875, 0.0531768798828125, 0.06937408447265625, 0.0855712890625, 0.10176849365234375, 0.1179656982421875, 0.13416290283203125, 0.150360107421875, 0.16655731201171875, 0.1827545166015625, 0.19895172119140625, 0.21514892578125, 0.23134613037109375, 0.2475433349609375, 0.26374053955078125, 0.279937744140625, 0.29613494873046875, 0.3123321533203125, 0.32852935791015625, 0.3447265625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 7.0, 7.0, 5.0, 7.0, 11.0, 18.0, 27.0, 29.0, 45.0, 39.0, 74.0, 127.0, 206.0, 463.0, 1145.0, 6883.0, 224796.0, 798741.0, 13041.0, 1616.0, 559.0, 268.0, 139.0, 77.0, 46.0, 50.0, 26.0, 22.0, 15.0, 19.0, 14.0, 9.0, 7.0, 5.0, 6.0, 4.0, 1.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.69140625, -2.618927001953125, -2.54644775390625, -2.473968505859375, -2.4014892578125, -2.329010009765625, -2.25653076171875, -2.184051513671875, -2.111572265625, -2.039093017578125, -1.96661376953125, -1.894134521484375, -1.8216552734375, -1.749176025390625, -1.67669677734375, -1.604217529296875, -1.53173828125, -1.459259033203125, -1.38677978515625, -1.314300537109375, -1.2418212890625, -1.169342041015625, -1.09686279296875, -1.024383544921875, -0.951904296875, -0.879425048828125, -0.80694580078125, -0.734466552734375, -0.6619873046875, -0.589508056640625, -0.51702880859375, -0.444549560546875, -0.3720703125, -0.299591064453125, -0.22711181640625, -0.154632568359375, -0.0821533203125, -0.009674072265625, 0.06280517578125, 0.135284423828125, 0.207763671875, 0.280242919921875, 0.35272216796875, 0.425201416015625, 0.4976806640625, 0.570159912109375, 0.64263916015625, 0.715118408203125, 0.78759765625, 0.860076904296875, 0.93255615234375, 1.005035400390625, 1.0775146484375, 1.149993896484375, 1.22247314453125, 1.294952392578125, 1.367431640625, 1.439910888671875, 1.51239013671875, 1.584869384765625, 1.6573486328125, 1.729827880859375, 1.80230712890625, 1.874786376953125, 1.947265625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 5.0, 2.0, 7.0, 5.0, 14.0, 9.0, 17.0, 17.0, 20.0, 24.0, 26.0, 33.0, 43.0, 49.0, 44.0, 49.0, 58.0, 46.0, 48.0, 52.0, 52.0, 66.0, 50.0, 46.0, 33.0, 30.0, 31.0, 31.0, 29.0, 17.0, 14.0, 10.0, 7.0, 5.0, 6.0, 5.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.634765625, -0.6110763549804688, -0.5873870849609375, -0.5636978149414062, -0.540008544921875, -0.5163192749023438, -0.4926300048828125, -0.46894073486328125, -0.44525146484375, -0.42156219482421875, -0.3978729248046875, -0.37418365478515625, -0.350494384765625, -0.32680511474609375, -0.3031158447265625, -0.27942657470703125, -0.2557373046875, -0.23204803466796875, -0.2083587646484375, -0.18466949462890625, -0.160980224609375, -0.13729095458984375, -0.1136016845703125, -0.08991241455078125, -0.06622314453125, -0.04253387451171875, -0.0188446044921875, 0.00484466552734375, 0.028533935546875, 0.05222320556640625, 0.0759124755859375, 0.09960174560546875, 0.123291015625, 0.14698028564453125, 0.1706695556640625, 0.19435882568359375, 0.218048095703125, 0.24173736572265625, 0.2654266357421875, 0.28911590576171875, 0.31280517578125, 0.33649444580078125, 0.3601837158203125, 0.38387298583984375, 0.407562255859375, 0.43125152587890625, 0.4549407958984375, 0.47863006591796875, 0.5023193359375, 0.5260086059570312, 0.5496978759765625, 0.5733871459960938, 0.597076416015625, 0.6207656860351562, 0.6444549560546875, 0.6681442260742188, 0.69183349609375, 0.7155227661132812, 0.7392120361328125, 0.7629013061523438, 0.786590576171875, 0.8102798461914062, 0.8339691162109375, 0.8576583862304688, 0.88134765625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 8.0, 8.0, 6.0, 4.0, 8.0, 14.0, 27.0, 31.0, 60.0, 101.0, 205.0, 560.0, 2577.0, 53870.0, 974102.0, 14871.0, 1363.0, 366.0, 159.0, 95.0, 39.0, 32.0, 16.0, 11.0, 6.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.67236328125, -0.6533355712890625, -0.634307861328125, -0.6152801513671875, -0.59625244140625, -0.5772247314453125, -0.558197021484375, -0.5391693115234375, -0.5201416015625, -0.5011138916015625, -0.482086181640625, -0.4630584716796875, -0.44403076171875, -0.4250030517578125, -0.405975341796875, -0.3869476318359375, -0.367919921875, -0.3488922119140625, -0.329864501953125, -0.3108367919921875, -0.29180908203125, -0.2727813720703125, -0.253753662109375, -0.2347259521484375, -0.2156982421875, -0.1966705322265625, -0.177642822265625, -0.1586151123046875, -0.13958740234375, -0.1205596923828125, -0.101531982421875, -0.0825042724609375, -0.0634765625, -0.0444488525390625, -0.025421142578125, -0.0063934326171875, 0.01263427734375, 0.0316619873046875, 0.050689697265625, 0.0697174072265625, 0.0887451171875, 0.1077728271484375, 0.126800537109375, 0.1458282470703125, 0.16485595703125, 0.1838836669921875, 0.202911376953125, 0.2219390869140625, 0.240966796875, 0.2599945068359375, 0.279022216796875, 0.2980499267578125, 0.31707763671875, 0.3361053466796875, 0.355133056640625, 0.3741607666015625, 0.3931884765625, 0.4122161865234375, 0.431243896484375, 0.4502716064453125, 0.46929931640625, 0.4883270263671875, 0.507354736328125, 0.5263824462890625, 0.54541015625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 6.0, 5.0, 10.0, 12.0, 19.0, 20.0, 33.0, 59.0, 129.0, 165.0, 141.0, 155.0, 94.0, 61.0, 35.0, 26.0, 12.0, 10.0, 5.0, 2.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.378225326538086e-05, -2.3089349269866943e-05, -2.2396445274353027e-05, -2.170354127883911e-05, -2.1010637283325195e-05, -2.031773328781128e-05, -1.9624829292297363e-05, -1.8931925296783447e-05, -1.823902130126953e-05, -1.7546117305755615e-05, -1.68532133102417e-05, -1.6160309314727783e-05, -1.5467405319213867e-05, -1.4774501323699951e-05, -1.4081597328186035e-05, -1.3388693332672119e-05, -1.2695789337158203e-05, -1.2002885341644287e-05, -1.1309981346130371e-05, -1.0617077350616455e-05, -9.924173355102539e-06, -9.231269359588623e-06, -8.538365364074707e-06, -7.845461368560791e-06, -7.152557373046875e-06, -6.459653377532959e-06, -5.766749382019043e-06, -5.073845386505127e-06, -4.380941390991211e-06, -3.688037395477295e-06, -2.995133399963379e-06, -2.302229404449463e-06, -1.6093254089355469e-06, -9.164214134216309e-07, -2.2351741790771484e-07, 4.6938657760620117e-07, 1.1622905731201172e-06, 1.8551945686340332e-06, 2.5480985641479492e-06, 3.2410025596618652e-06, 3.933906555175781e-06, 4.626810550689697e-06, 5.319714546203613e-06, 6.012618541717529e-06, 6.705522537231445e-06, 7.398426532745361e-06, 8.091330528259277e-06, 8.784234523773193e-06, 9.47713851928711e-06, 1.0170042514801025e-05, 1.0862946510314941e-05, 1.1555850505828857e-05, 1.2248754501342773e-05, 1.294165849685669e-05, 1.3634562492370605e-05, 1.4327466487884521e-05, 1.5020370483398438e-05, 1.5713274478912354e-05, 1.640617847442627e-05, 1.7099082469940186e-05, 1.77919864654541e-05, 1.8484890460968018e-05, 1.9177794456481934e-05, 1.987069845199585e-05, 2.0563602447509766e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 11.0, 10.0, 15.0, 12.0, 25.0, 42.0, 61.0, 117.0, 200.0, 441.0, 1872.0, 17194.0, 952340.0, 70721.0, 3963.0, 855.0, 295.0, 138.0, 86.0, 38.0, 31.0, 22.0, 14.0, 6.0, 6.0, 7.0, 4.0, 4.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0], "bins": [-0.6865234375, -0.6687812805175781, -0.6510391235351562, -0.6332969665527344, -0.6155548095703125, -0.5978126525878906, -0.5800704956054688, -0.5623283386230469, -0.544586181640625, -0.5268440246582031, -0.5091018676757812, -0.4913597106933594, -0.4736175537109375, -0.4558753967285156, -0.43813323974609375, -0.4203910827636719, -0.40264892578125, -0.3849067687988281, -0.36716461181640625, -0.3494224548339844, -0.3316802978515625, -0.3139381408691406, -0.29619598388671875, -0.2784538269042969, -0.260711669921875, -0.24296951293945312, -0.22522735595703125, -0.20748519897460938, -0.1897430419921875, -0.17200088500976562, -0.15425872802734375, -0.13651657104492188, -0.1187744140625, -0.10103225708007812, -0.08329010009765625, -0.06554794311523438, -0.0478057861328125, -0.030063629150390625, -0.01232147216796875, 0.005420684814453125, 0.023162841796875, 0.040904998779296875, 0.05864715576171875, 0.07638931274414062, 0.0941314697265625, 0.11187362670898438, 0.12961578369140625, 0.14735794067382812, 0.16510009765625, 0.18284225463867188, 0.20058441162109375, 0.21832656860351562, 0.2360687255859375, 0.2538108825683594, 0.27155303955078125, 0.2892951965332031, 0.307037353515625, 0.3247795104980469, 0.34252166748046875, 0.3602638244628906, 0.3780059814453125, 0.3957481384277344, 0.41349029541015625, 0.4312324523925781, 0.448974609375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 1.0, 2.0, 3.0, 3.0, 1.0, 9.0, 7.0, 10.0, 7.0, 18.0, 29.0, 35.0, 51.0, 70.0, 82.0, 103.0, 127.0, 120.0, 79.0, 75.0, 38.0, 34.0, 26.0, 18.0, 6.0, 13.0, 10.0, 8.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1480712890625, -0.14200782775878906, -0.13594436645507812, -0.1298809051513672, -0.12381744384765625, -0.11775398254394531, -0.11169052124023438, -0.10562705993652344, -0.0995635986328125, -0.09350013732910156, -0.08743667602539062, -0.08137321472167969, -0.07530975341796875, -0.06924629211425781, -0.06318283081054688, -0.05711936950683594, -0.051055908203125, -0.04499244689941406, -0.038928985595703125, -0.03286552429199219, -0.02680206298828125, -0.020738601684570312, -0.014675140380859375, -0.008611679077148438, -0.0025482177734375, 0.0035152435302734375, 0.009578704833984375, 0.015642166137695312, 0.02170562744140625, 0.027769088745117188, 0.033832550048828125, 0.03989601135253906, 0.04595947265625, 0.05202293395996094, 0.058086395263671875, 0.06414985656738281, 0.07021331787109375, 0.07627677917480469, 0.08234024047851562, 0.08840370178222656, 0.0944671630859375, 0.10053062438964844, 0.10659408569335938, 0.11265754699707031, 0.11872100830078125, 0.12478446960449219, 0.13084793090820312, 0.13691139221191406, 0.142974853515625, 0.14903831481933594, 0.15510177612304688, 0.1611652374267578, 0.16722869873046875, 0.1732921600341797, 0.17935562133789062, 0.18541908264160156, 0.1914825439453125, 0.19754600524902344, 0.20360946655273438, 0.2096729278564453, 0.21573638916015625, 0.2217998504638672, 0.22786331176757812, 0.23392677307128906, 0.239990234375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 20.0, 227.0, 716.0, 43.0, 5.0, 0.0, 1.0], "bins": [-41.116172790527344, -40.42205047607422, -39.72792434692383, -39.0338020324707, -38.33967590332031, -37.64555358886719, -36.95143127441406, -36.25730514526367, -35.56318283081055, -34.86906051635742, -34.17493438720703, -33.480812072753906, -32.786685943603516, -32.09256362915039, -31.398439407348633, -30.704315185546875, -30.010189056396484, -29.316064834594727, -28.62194061279297, -27.927818298339844, -27.233694076538086, -26.539569854736328, -25.84544563293457, -25.151321411132812, -24.457199096679688, -23.76307487487793, -23.068950653076172, -22.374828338623047, -21.68070411682129, -20.98657989501953, -20.292455673217773, -19.598331451416016, -18.904207229614258, -18.2100830078125, -17.515958786010742, -16.821834564208984, -16.12771224975586, -15.433588027954102, -14.739463806152344, -14.045339584350586, -13.351215362548828, -12.65709114074707, -11.962967872619629, -11.268843650817871, -10.574719429016113, -9.880596160888672, -9.186471939086914, -8.492347717285156, -7.798224449157715, -7.104100704193115, -6.409976482391357, -5.715852737426758, -5.021728515625, -4.3276047706604, -3.633481025695801, -2.939356803894043, -2.2452330589294434, -1.5511090755462646, -0.8569852113723755, -0.16286134719848633, 0.5312626361846924, 1.225386619567871, 1.9195103645324707, 2.6136345863342285, 3.307758331298828]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 6.0, 11.0, 15.0, 25.0, 27.0, 24.0, 33.0, 36.0, 45.0, 49.0, 54.0, 61.0, 74.0, 69.0, 76.0, 60.0, 56.0, 52.0, 48.0, 31.0, 32.0, 29.0, 24.0, 19.0, 14.0, 6.0, 11.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.673714637756348, -4.497820854187012, -4.321927070617676, -4.14603328704834, -3.970139503479004, -3.794245719909668, -3.618351936340332, -3.442458152770996, -3.26656436920166, -3.090670585632324, -2.9147768020629883, -2.7388830184936523, -2.5629892349243164, -2.3870954513549805, -2.2112016677856445, -2.0353078842163086, -1.8594141006469727, -1.6835203170776367, -1.5076265335083008, -1.3317327499389648, -1.155838966369629, -0.979945182800293, -0.804051399230957, -0.6281576156616211, -0.45226383209228516, -0.2763700485229492, -0.10047626495361328, 0.07541751861572266, 0.2513113021850586, 0.42720508575439453, 0.6030988693237305, 0.7789926528930664, 0.9548859596252441, 1.13077974319458, 1.306673526763916, 1.482567310333252, 1.658461093902588, 1.8343548774719238, 2.0102486610412598, 2.1861424446105957, 2.3620362281799316, 2.5379300117492676, 2.7138237953186035, 2.8897175788879395, 3.0656113624572754, 3.2415051460266113, 3.4173989295959473, 3.593292713165283, 3.769186496734619, 3.945080280303955, 4.120974063873291, 4.296867847442627, 4.472761631011963, 4.648655414581299, 4.824549198150635, 5.000442981719971, 5.176336765289307, 5.352230548858643, 5.5281243324279785, 5.7040181159973145, 5.87991189956665, 6.055805683135986, 6.231699466705322, 6.407593250274658, 6.583487033843994]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 10.0, 16.0, 12.0, 23.0, 37.0, 106.0, 201.0, 956.0, 393109.0, 3798517.0, 962.0, 196.0, 65.0, 37.0, 10.0, 11.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.19921875, -7.031829833984375, -6.86444091796875, -6.697052001953125, -6.5296630859375, -6.362274169921875, -6.19488525390625, -6.027496337890625, -5.860107421875, -5.692718505859375, -5.52532958984375, -5.357940673828125, -5.1905517578125, -5.023162841796875, -4.85577392578125, -4.688385009765625, -4.52099609375, -4.353607177734375, -4.18621826171875, -4.018829345703125, -3.8514404296875, -3.684051513671875, -3.51666259765625, -3.349273681640625, -3.181884765625, -3.014495849609375, -2.84710693359375, -2.679718017578125, -2.5123291015625, -2.344940185546875, -2.17755126953125, -2.010162353515625, -1.8427734375, -1.675384521484375, -1.50799560546875, -1.340606689453125, -1.1732177734375, -1.005828857421875, -0.83843994140625, -0.671051025390625, -0.503662109375, -0.336273193359375, -0.16888427734375, -0.001495361328125, 0.1658935546875, 0.333282470703125, 0.50067138671875, 0.668060302734375, 0.83544921875, 1.002838134765625, 1.17022705078125, 1.337615966796875, 1.5050048828125, 1.672393798828125, 1.83978271484375, 2.007171630859375, 2.174560546875, 2.341949462890625, 2.50933837890625, 2.676727294921875, 2.8441162109375, 3.011505126953125, 3.17889404296875, 3.346282958984375, 3.513671875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 10.0, 17.0, 102.0, 263.0, 375.0, 163.0, 45.0, 12.0, 7.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72216796875, -0.7054595947265625, -0.688751220703125, -0.6720428466796875, -0.65533447265625, -0.6386260986328125, -0.621917724609375, -0.6052093505859375, -0.5885009765625, -0.5717926025390625, -0.555084228515625, -0.5383758544921875, -0.52166748046875, -0.5049591064453125, -0.488250732421875, -0.4715423583984375, -0.454833984375, -0.4381256103515625, -0.421417236328125, -0.4047088623046875, -0.38800048828125, -0.3712921142578125, -0.354583740234375, -0.3378753662109375, -0.3211669921875, -0.3044586181640625, -0.287750244140625, -0.2710418701171875, -0.25433349609375, -0.2376251220703125, -0.220916748046875, -0.2042083740234375, -0.1875, -0.1707916259765625, -0.154083251953125, -0.1373748779296875, -0.12066650390625, -0.1039581298828125, -0.087249755859375, -0.0705413818359375, -0.0538330078125, -0.0371246337890625, -0.020416259765625, -0.0037078857421875, 0.01300048828125, 0.0297088623046875, 0.046417236328125, 0.0631256103515625, 0.079833984375, 0.0965423583984375, 0.113250732421875, 0.1299591064453125, 0.14666748046875, 0.1633758544921875, 0.180084228515625, 0.1967926025390625, 0.2135009765625, 0.2302093505859375, 0.246917724609375, 0.2636260986328125, 0.28033447265625, 0.2970428466796875, 0.313751220703125, 0.3304595947265625, 0.34716796875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 8.0, 12.0, 11.0, 24.0, 51.0, 91.0, 204.0, 675.0, 2005.0, 8554.0, 195867.0, 3971307.0, 12140.0, 2263.0, 631.0, 206.0, 110.0, 45.0, 18.0, 15.0, 11.0, 6.0, 7.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.44140625, -1.3935394287109375, -1.345672607421875, -1.2978057861328125, -1.24993896484375, -1.2020721435546875, -1.154205322265625, -1.1063385009765625, -1.0584716796875, -1.0106048583984375, -0.962738037109375, -0.9148712158203125, -0.86700439453125, -0.8191375732421875, -0.771270751953125, -0.7234039306640625, -0.675537109375, -0.6276702880859375, -0.579803466796875, -0.5319366455078125, -0.48406982421875, -0.4362030029296875, -0.388336181640625, -0.3404693603515625, -0.2926025390625, -0.2447357177734375, -0.196868896484375, -0.1490020751953125, -0.10113525390625, -0.0532684326171875, -0.005401611328125, 0.0424652099609375, 0.09033203125, 0.1381988525390625, 0.186065673828125, 0.2339324951171875, 0.28179931640625, 0.3296661376953125, 0.377532958984375, 0.4253997802734375, 0.4732666015625, 0.5211334228515625, 0.569000244140625, 0.6168670654296875, 0.66473388671875, 0.7126007080078125, 0.760467529296875, 0.8083343505859375, 0.856201171875, 0.9040679931640625, 0.951934814453125, 0.9998016357421875, 1.04766845703125, 1.0955352783203125, 1.143402099609375, 1.1912689208984375, 1.2391357421875, 1.2870025634765625, 1.334869384765625, 1.3827362060546875, 1.43060302734375, 1.4784698486328125, 1.526336669921875, 1.5742034912109375, 1.6220703125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 5.0, 8.0, 7.0, 6.0, 15.0, 18.0, 38.0, 50.0, 113.0, 1190.0, 2374.0, 114.0, 42.0, 23.0, 19.0, 10.0, 9.0, 2.0, 5.0, 5.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33935546875, -0.3296661376953125, -0.319976806640625, -0.3102874755859375, -0.30059814453125, -0.2909088134765625, -0.281219482421875, -0.2715301513671875, -0.2618408203125, -0.2521514892578125, -0.242462158203125, -0.2327728271484375, -0.22308349609375, -0.2133941650390625, -0.203704833984375, -0.1940155029296875, -0.184326171875, -0.1746368408203125, -0.164947509765625, -0.1552581787109375, -0.14556884765625, -0.1358795166015625, -0.126190185546875, -0.1165008544921875, -0.1068115234375, -0.0971221923828125, -0.087432861328125, -0.0777435302734375, -0.06805419921875, -0.0583648681640625, -0.048675537109375, -0.0389862060546875, -0.029296875, -0.0196075439453125, -0.009918212890625, -0.0002288818359375, 0.00946044921875, 0.0191497802734375, 0.028839111328125, 0.0385284423828125, 0.0482177734375, 0.0579071044921875, 0.067596435546875, 0.0772857666015625, 0.08697509765625, 0.0966644287109375, 0.106353759765625, 0.1160430908203125, 0.125732421875, 0.1354217529296875, 0.145111083984375, 0.1548004150390625, 0.16448974609375, 0.1741790771484375, 0.183868408203125, 0.1935577392578125, 0.2032470703125, 0.2129364013671875, 0.222625732421875, 0.2323150634765625, 0.24200439453125, 0.2516937255859375, 0.261383056640625, 0.2710723876953125, 0.28076171875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 7.0, 15.0, 60.0, 323.0, 477.0, 88.0, 27.0, 6.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5450942516326904, -1.488369107246399, -1.4316439628601074, -1.374918818473816, -1.3181936740875244, -1.2614684104919434, -1.2047433853149414, -1.1480181217193604, -1.0912929773330688, -1.0345678329467773, -0.9778426885604858, -0.9211175441741943, -0.8643923401832581, -0.8076671957969666, -0.750942051410675, -0.6942168474197388, -0.637491762638092, -0.5807666182518005, -0.524041473865509, -0.46731629967689514, -0.41059112548828125, -0.35386598110198975, -0.29714083671569824, -0.24041566252708435, -0.18369051814079285, -0.12696535885334015, -0.07024020701646805, -0.013515055179595947, 0.04321010410785675, 0.09993526339530945, 0.15666040778160095, 0.21338558197021484, 0.27011072635650635, 0.32683587074279785, 0.38356104493141174, 0.44028618931770325, 0.49701136350631714, 0.5537365078926086, 0.6104616522789001, 0.6671868562698364, 0.7239120006561279, 0.7806371450424194, 0.8373622894287109, 0.8940874338150024, 0.9508126378059387, 1.007537841796875, 1.064262866973877, 1.120988130569458, 1.17771315574646, 1.2344383001327515, 1.291163444519043, 1.3478885889053345, 1.404613733291626, 1.461338996887207, 1.518064022064209, 1.57478928565979, 1.6315144300460815, 1.688239574432373, 1.7449647188186646, 1.801689863204956, 1.8584150075912476, 1.915140151977539, 1.9718654155731201, 2.028590440750122, 2.085315704345703]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 14.0, 16.0, 12.0, 23.0, 20.0, 45.0, 56.0, 57.0, 75.0, 74.0, 83.0, 92.0, 78.0, 69.0, 56.0, 55.0, 42.0, 43.0, 32.0, 13.0, 17.0, 8.0, 10.0, 5.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8000990748405457, -0.7672092318534851, -0.7343193888664246, -0.701429545879364, -0.6685397028923035, -0.6356498599052429, -0.6027599573135376, -0.569870114326477, -0.5369802713394165, -0.504090428352356, -0.4712005853652954, -0.43831074237823486, -0.4054208993911743, -0.37253105640411377, -0.33964118361473083, -0.3067513406276703, -0.27386152744293213, -0.24097168445587158, -0.20808184146881104, -0.1751919835805893, -0.14230214059352875, -0.1094122976064682, -0.07652243971824646, -0.04363259673118591, -0.010742753744125366, 0.02214709296822548, 0.055036939680576324, 0.08792679011821747, 0.12081663310527802, 0.15370647609233856, 0.1865963339805603, 0.21948617696762085, 0.2523759603500366, 0.28526580333709717, 0.3181556463241577, 0.35104548931121826, 0.3839353322982788, 0.41682517528533936, 0.4497150480747223, 0.48260489106178284, 0.515494704246521, 0.5483845472335815, 0.5812743902206421, 0.6141642332077026, 0.6470540761947632, 0.6799439191818237, 0.7128337621688843, 0.7457236051559448, 0.7786135077476501, 0.8115033507347107, 0.8443931937217712, 0.8772830367088318, 0.9101728796958923, 0.9430627226829529, 0.9759526252746582, 1.0088424682617188, 1.0417323112487793, 1.0746221542358398, 1.1075119972229004, 1.140401840209961, 1.1732916831970215, 1.206181526184082, 1.2390713691711426, 1.2719612121582031, 1.3048510551452637]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 7.0, 3.0, 4.0, 9.0, 8.0, 18.0, 26.0, 26.0, 36.0, 59.0, 89.0, 124.0, 243.0, 419.0, 832.0, 1837.0, 6113.0, 201654.0, 822506.0, 10041.0, 2291.0, 966.0, 486.0, 268.0, 138.0, 84.0, 84.0, 44.0, 28.0, 34.0, 19.0, 8.0, 13.0, 10.0, 7.0, 5.0, 7.0, 6.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6943359375, -1.6361541748046875, -1.577972412109375, -1.5197906494140625, -1.46160888671875, -1.4034271240234375, -1.345245361328125, -1.2870635986328125, -1.2288818359375, -1.1707000732421875, -1.112518310546875, -1.0543365478515625, -0.99615478515625, -0.9379730224609375, -0.879791259765625, -0.8216094970703125, -0.763427734375, -0.7052459716796875, -0.647064208984375, -0.5888824462890625, -0.53070068359375, -0.4725189208984375, -0.414337158203125, -0.3561553955078125, -0.2979736328125, -0.2397918701171875, -0.181610107421875, -0.1234283447265625, -0.06524658203125, -0.0070648193359375, 0.051116943359375, 0.1092987060546875, 0.16748046875, 0.2256622314453125, 0.283843994140625, 0.3420257568359375, 0.40020751953125, 0.4583892822265625, 0.516571044921875, 0.5747528076171875, 0.6329345703125, 0.6911163330078125, 0.749298095703125, 0.8074798583984375, 0.86566162109375, 0.9238433837890625, 0.982025146484375, 1.0402069091796875, 1.098388671875, 1.1565704345703125, 1.214752197265625, 1.2729339599609375, 1.33111572265625, 1.3892974853515625, 1.447479248046875, 1.5056610107421875, 1.5638427734375, 1.6220245361328125, 1.680206298828125, 1.7383880615234375, 1.79656982421875, 1.8547515869140625, 1.912933349609375, 1.9711151123046875, 2.029296875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 11.0, 34.0, 162.0, 343.0, 302.0, 98.0, 25.0, 15.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70068359375, -0.684326171875, -0.66796875, -0.651611328125, -0.63525390625, -0.618896484375, -0.6025390625, -0.586181640625, -0.56982421875, -0.553466796875, -0.537109375, -0.520751953125, -0.50439453125, -0.488037109375, -0.4716796875, -0.455322265625, -0.43896484375, -0.422607421875, -0.40625, -0.389892578125, -0.37353515625, -0.357177734375, -0.3408203125, -0.324462890625, -0.30810546875, -0.291748046875, -0.275390625, -0.259033203125, -0.24267578125, -0.226318359375, -0.2099609375, -0.193603515625, -0.17724609375, -0.160888671875, -0.14453125, -0.128173828125, -0.11181640625, -0.095458984375, -0.0791015625, -0.062744140625, -0.04638671875, -0.030029296875, -0.013671875, 0.002685546875, 0.01904296875, 0.035400390625, 0.0517578125, 0.068115234375, 0.08447265625, 0.100830078125, 0.1171875, 0.133544921875, 0.14990234375, 0.166259765625, 0.1826171875, 0.198974609375, 0.21533203125, 0.231689453125, 0.248046875, 0.264404296875, 0.28076171875, 0.297119140625, 0.3134765625, 0.329833984375, 0.34619140625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 4.0, 4.0, 7.0, 7.0, 15.0, 15.0, 18.0, 18.0, 13.0, 45.0, 35.0, 42.0, 81.0, 126.0, 248.0, 499.0, 1552.0, 9899.0, 218602.0, 788827.0, 24418.0, 2538.0, 745.0, 321.0, 151.0, 97.0, 62.0, 36.0, 27.0, 15.0, 14.0, 17.0, 14.0, 9.0, 10.0, 9.0, 5.0, 8.0, 1.0, 3.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5751953125, -1.5290985107421875, -1.483001708984375, -1.4369049072265625, -1.39080810546875, -1.3447113037109375, -1.298614501953125, -1.2525177001953125, -1.2064208984375, -1.1603240966796875, -1.114227294921875, -1.0681304931640625, -1.02203369140625, -0.9759368896484375, -0.929840087890625, -0.8837432861328125, -0.837646484375, -0.7915496826171875, -0.745452880859375, -0.6993560791015625, -0.65325927734375, -0.6071624755859375, -0.561065673828125, -0.5149688720703125, -0.4688720703125, -0.4227752685546875, -0.376678466796875, -0.3305816650390625, -0.28448486328125, -0.2383880615234375, -0.192291259765625, -0.1461944580078125, -0.10009765625, -0.0540008544921875, -0.007904052734375, 0.0381927490234375, 0.08428955078125, 0.1303863525390625, 0.176483154296875, 0.2225799560546875, 0.2686767578125, 0.3147735595703125, 0.360870361328125, 0.4069671630859375, 0.45306396484375, 0.4991607666015625, 0.545257568359375, 0.5913543701171875, 0.637451171875, 0.6835479736328125, 0.729644775390625, 0.7757415771484375, 0.82183837890625, 0.8679351806640625, 0.914031982421875, 0.9601287841796875, 1.0062255859375, 1.0523223876953125, 1.098419189453125, 1.1445159912109375, 1.19061279296875, 1.2367095947265625, 1.282806396484375, 1.3289031982421875, 1.375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 7.0, 3.0, 11.0, 9.0, 6.0, 15.0, 16.0, 11.0, 15.0, 20.0, 27.0, 32.0, 39.0, 44.0, 34.0, 35.0, 53.0, 48.0, 49.0, 58.0, 61.0, 48.0, 45.0, 42.0, 43.0, 39.0, 26.0, 22.0, 31.0, 17.0, 20.0, 16.0, 17.0, 13.0, 12.0, 5.0, 8.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62255859375, -0.601898193359375, -0.58123779296875, -0.560577392578125, -0.5399169921875, -0.519256591796875, -0.49859619140625, -0.477935791015625, -0.457275390625, -0.436614990234375, -0.41595458984375, -0.395294189453125, -0.3746337890625, -0.353973388671875, -0.33331298828125, -0.312652587890625, -0.2919921875, -0.271331787109375, -0.25067138671875, -0.230010986328125, -0.2093505859375, -0.188690185546875, -0.16802978515625, -0.147369384765625, -0.126708984375, -0.106048583984375, -0.08538818359375, -0.064727783203125, -0.0440673828125, -0.023406982421875, -0.00274658203125, 0.017913818359375, 0.03857421875, 0.059234619140625, 0.07989501953125, 0.100555419921875, 0.1212158203125, 0.141876220703125, 0.16253662109375, 0.183197021484375, 0.203857421875, 0.224517822265625, 0.24517822265625, 0.265838623046875, 0.2864990234375, 0.307159423828125, 0.32781982421875, 0.348480224609375, 0.369140625, 0.389801025390625, 0.41046142578125, 0.431121826171875, 0.4517822265625, 0.472442626953125, 0.49310302734375, 0.513763427734375, 0.534423828125, 0.555084228515625, 0.57574462890625, 0.596405029296875, 0.6170654296875, 0.637725830078125, 0.65838623046875, 0.679046630859375, 0.69970703125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 9.0, 9.0, 11.0, 10.0, 27.0, 45.0, 78.0, 124.0, 240.0, 399.0, 1020.0, 2681.0, 9628.0, 70576.0, 821431.0, 123401.0, 13391.0, 3264.0, 1138.0, 472.0, 247.0, 123.0, 72.0, 50.0, 30.0, 25.0, 15.0, 15.0, 2.0, 6.0, 6.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.157958984375, -0.15262222290039062, -0.14728546142578125, -0.14194869995117188, -0.1366119384765625, -0.13127517700195312, -0.12593841552734375, -0.12060165405273438, -0.115264892578125, -0.10992813110351562, -0.10459136962890625, -0.09925460815429688, -0.0939178466796875, -0.08858108520507812, -0.08324432373046875, -0.07790756225585938, -0.07257080078125, -0.06723403930664062, -0.06189727783203125, -0.056560516357421875, -0.0512237548828125, -0.045886993408203125, -0.04055023193359375, -0.035213470458984375, -0.029876708984375, -0.024539947509765625, -0.01920318603515625, -0.013866424560546875, -0.0085296630859375, -0.003192901611328125, 0.00214385986328125, 0.007480621337890625, 0.0128173828125, 0.018154144287109375, 0.02349090576171875, 0.028827667236328125, 0.0341644287109375, 0.039501190185546875, 0.04483795166015625, 0.050174713134765625, 0.055511474609375, 0.060848236083984375, 0.06618499755859375, 0.07152175903320312, 0.0768585205078125, 0.08219528198242188, 0.08753204345703125, 0.09286880493164062, 0.09820556640625, 0.10354232788085938, 0.10887908935546875, 0.11421585083007812, 0.1195526123046875, 0.12488937377929688, 0.13022613525390625, 0.13556289672851562, 0.140899658203125, 0.14623641967773438, 0.15157318115234375, 0.15690994262695312, 0.1622467041015625, 0.16758346557617188, 0.17292022705078125, 0.17825698852539062, 0.18359375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 9.0, 11.0, 20.0, 17.0, 33.0, 47.0, 78.0, 108.0, 133.0, 158.0, 139.0, 82.0, 64.0, 47.0, 32.0, 13.0, 8.0, 6.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.806020736694336e-05, -1.7463229596614838e-05, -1.6866251826286316e-05, -1.6269274055957794e-05, -1.5672296285629272e-05, -1.507531851530075e-05, -1.4478340744972229e-05, -1.3881362974643707e-05, -1.3284385204315186e-05, -1.2687407433986664e-05, -1.2090429663658142e-05, -1.149345189332962e-05, -1.0896474123001099e-05, -1.0299496352672577e-05, -9.702518582344055e-06, -9.105540812015533e-06, -8.508563041687012e-06, -7.91158527135849e-06, -7.314607501029968e-06, -6.7176297307014465e-06, -6.120651960372925e-06, -5.523674190044403e-06, -4.926696419715881e-06, -4.32971864938736e-06, -3.732740879058838e-06, -3.135763108730316e-06, -2.5387853384017944e-06, -1.9418075680732727e-06, -1.344829797744751e-06, -7.478520274162292e-07, -1.5087425708770752e-07, 4.461035132408142e-07, 1.043081283569336e-06, 1.6400590538978577e-06, 2.2370368242263794e-06, 2.834014594554901e-06, 3.430992364883423e-06, 4.027970135211945e-06, 4.624947905540466e-06, 5.221925675868988e-06, 5.81890344619751e-06, 6.4158812165260315e-06, 7.012858986854553e-06, 7.609836757183075e-06, 8.206814527511597e-06, 8.803792297840118e-06, 9.40077006816864e-06, 9.997747838497162e-06, 1.0594725608825684e-05, 1.1191703379154205e-05, 1.1788681149482727e-05, 1.2385658919811249e-05, 1.298263669013977e-05, 1.3579614460468292e-05, 1.4176592230796814e-05, 1.4773570001125336e-05, 1.5370547771453857e-05, 1.596752554178238e-05, 1.65645033121109e-05, 1.7161481082439423e-05, 1.7758458852767944e-05, 1.8355436623096466e-05, 1.8952414393424988e-05, 1.954939216375351e-05, 2.014636993408203e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 12.0, 13.0, 15.0, 19.0, 28.0, 58.0, 90.0, 215.0, 562.0, 2878.0, 49304.0, 972425.0, 20064.0, 2009.0, 465.0, 176.0, 80.0, 48.0, 34.0, 16.0, 9.0, 7.0, 5.0, 4.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4345703125, -0.4215507507324219, -0.40853118896484375, -0.3955116271972656, -0.3824920654296875, -0.3694725036621094, -0.35645294189453125, -0.3434333801269531, -0.330413818359375, -0.3173942565917969, -0.30437469482421875, -0.2913551330566406, -0.2783355712890625, -0.2653160095214844, -0.25229644775390625, -0.23927688598632812, -0.22625732421875, -0.21323776245117188, -0.20021820068359375, -0.18719863891601562, -0.1741790771484375, -0.16115951538085938, -0.14813995361328125, -0.13512039184570312, -0.122100830078125, -0.10908126831054688, -0.09606170654296875, -0.08304214477539062, -0.0700225830078125, -0.057003021240234375, -0.04398345947265625, -0.030963897705078125, -0.0179443359375, -0.004924774169921875, 0.00809478759765625, 0.021114349365234375, 0.0341339111328125, 0.047153472900390625, 0.06017303466796875, 0.07319259643554688, 0.086212158203125, 0.09923171997070312, 0.11225128173828125, 0.12527084350585938, 0.1382904052734375, 0.15130996704101562, 0.16432952880859375, 0.17734909057617188, 0.19036865234375, 0.20338821411132812, 0.21640777587890625, 0.22942733764648438, 0.2424468994140625, 0.2554664611816406, 0.26848602294921875, 0.2815055847167969, 0.294525146484375, 0.3075447082519531, 0.32056427001953125, 0.3335838317871094, 0.3466033935546875, 0.3596229553222656, 0.37264251708984375, 0.3856620788574219, 0.398681640625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 1.0, 5.0, 3.0, 3.0, 7.0, 6.0, 8.0, 24.0, 29.0, 31.0, 60.0, 57.0, 87.0, 97.0, 110.0, 104.0, 90.0, 78.0, 53.0, 40.0, 24.0, 25.0, 12.0, 11.0, 8.0, 8.0, 10.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1566162109375, -0.1513347625732422, -0.14605331420898438, -0.14077186584472656, -0.13549041748046875, -0.13020896911621094, -0.12492752075195312, -0.11964607238769531, -0.1143646240234375, -0.10908317565917969, -0.10380172729492188, -0.09852027893066406, -0.09323883056640625, -0.08795738220214844, -0.08267593383789062, -0.07739448547363281, -0.072113037109375, -0.06683158874511719, -0.061550140380859375, -0.05626869201660156, -0.05098724365234375, -0.04570579528808594, -0.040424346923828125, -0.03514289855957031, -0.0298614501953125, -0.024580001831054688, -0.019298553466796875, -0.014017105102539062, -0.00873565673828125, -0.0034542083740234375, 0.001827239990234375, 0.0071086883544921875, 0.01239013671875, 0.017671585083007812, 0.022953033447265625, 0.028234481811523438, 0.03351593017578125, 0.03879737854003906, 0.044078826904296875, 0.04936027526855469, 0.0546417236328125, 0.05992317199707031, 0.06520462036132812, 0.07048606872558594, 0.07576751708984375, 0.08104896545410156, 0.08633041381835938, 0.09161186218261719, 0.096893310546875, 0.10217475891113281, 0.10745620727539062, 0.11273765563964844, 0.11801910400390625, 0.12330055236816406, 0.12858200073242188, 0.1338634490966797, 0.1391448974609375, 0.1444263458251953, 0.14970779418945312, 0.15498924255371094, 0.16027069091796875, 0.16555213928222656, 0.17083358764648438, 0.1761150360107422, 0.181396484375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 8.0, 6.0, 20.0, 30.0, 73.0, 171.0, 334.0, 195.0, 78.0, 36.0, 26.0, 12.0, 8.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.589051246643066, -5.455007553100586, -5.320964336395264, -5.186920642852783, -5.052877426147461, -4.9188337326049805, -4.784790515899658, -4.650746822357178, -4.5167036056518555, -4.382659912109375, -4.248616695404053, -4.114573001861572, -3.98052978515625, -3.8464863300323486, -3.7124428749084473, -3.578399181365967, -3.4443557262420654, -3.310312271118164, -3.1762688159942627, -3.0422253608703613, -2.90818190574646, -2.7741384506225586, -2.640094757080078, -2.506051540374756, -2.3720078468322754, -2.237964391708374, -2.1039209365844727, -1.9698774814605713, -1.83583402633667, -1.7017905712127686, -1.5677469968795776, -1.4337035417556763, -1.2996599674224854, -1.165616512298584, -1.0315730571746826, -0.8975295424461365, -0.7634860873222351, -0.6294426321983337, -0.4953991174697876, -0.36135566234588623, -0.22731220722198486, -0.0932687371969223, 0.04077473282814026, 0.174818217754364, 0.3088616728782654, 0.44290512800216675, 0.5769486427307129, 0.7109920978546143, 0.8450355529785156, 0.979079008102417, 1.1131224632263184, 1.2471659183502197, 1.381209373474121, 1.5152528285980225, 1.6492964029312134, 1.7833398580551147, 1.9173833131790161, 2.051426887512207, 2.1854703426361084, 2.3195137977600098, 2.453557252883911, 2.5876007080078125, 2.721644163131714, 2.8556876182556152, 2.9897310733795166]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 2.0, 6.0, 4.0, 10.0, 8.0, 9.0, 18.0, 16.0, 18.0, 24.0, 24.0, 31.0, 31.0, 33.0, 43.0, 45.0, 48.0, 51.0, 44.0, 54.0, 60.0, 47.0, 49.0, 37.0, 35.0, 35.0, 31.0, 28.0, 28.0, 20.0, 24.0, 21.0, 14.0, 14.0, 9.0, 9.0, 6.0, 5.0, 5.0, 3.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.11759090423584, -3.0048656463623047, -2.8921406269073486, -2.7794156074523926, -2.6666903495788574, -2.5539650917053223, -2.441240072250366, -2.32851505279541, -2.215789794921875, -2.10306453704834, -1.9903395175933838, -1.8776143789291382, -1.7648892402648926, -1.652164101600647, -1.5394389629364014, -1.4267138242721558, -1.3139886856079102, -1.2012635469436646, -1.088538408279419, -0.9758132696151733, -0.8630881309509277, -0.7503629922866821, -0.6376378536224365, -0.5249127149581909, -0.4121875762939453, -0.2994624376296997, -0.1867372989654541, -0.0740121603012085, 0.03871297836303711, 0.15143811702728271, 0.2641632556915283, 0.3768883943557739, 0.48961353302001953, 0.6023386716842651, 0.7150638103485107, 0.8277889490127563, 0.940514087677002, 1.0532392263412476, 1.1659643650054932, 1.2786895036697388, 1.3914146423339844, 1.50413978099823, 1.6168649196624756, 1.7295900583267212, 1.8423151969909668, 1.9550403356552124, 2.067765474319458, 2.180490493774414, 2.293215751647949, 2.4059410095214844, 2.5186660289764404, 2.6313910484313965, 2.7441163063049316, 2.856841564178467, 2.969566583633423, 3.082291603088379, 3.195016860961914, 3.307742118835449, 3.4204671382904053, 3.5331921577453613, 3.6459174156188965, 3.7586426734924316, 3.8713676929473877, 3.9840927124023438, 4.096817970275879]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 8.0, 11.0, 21.0, 53.0, 233.0, 2143.0, 4190961.0, 684.0, 105.0, 34.0, 9.0, 6.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.29296875, -7.1246337890625, -6.956298828125, -6.7879638671875, -6.61962890625, -6.4512939453125, -6.282958984375, -6.1146240234375, -5.9462890625, -5.7779541015625, -5.609619140625, -5.4412841796875, -5.27294921875, -5.1046142578125, -4.936279296875, -4.7679443359375, -4.599609375, -4.4312744140625, -4.262939453125, -4.0946044921875, -3.92626953125, -3.7579345703125, -3.589599609375, -3.4212646484375, -3.2529296875, -3.0845947265625, -2.916259765625, -2.7479248046875, -2.57958984375, -2.4112548828125, -2.242919921875, -2.0745849609375, -1.90625, -1.7379150390625, -1.569580078125, -1.4012451171875, -1.23291015625, -1.0645751953125, -0.896240234375, -0.7279052734375, -0.5595703125, -0.3912353515625, -0.222900390625, -0.0545654296875, 0.11376953125, 0.2821044921875, 0.450439453125, 0.6187744140625, 0.787109375, 0.9554443359375, 1.123779296875, 1.2921142578125, 1.46044921875, 1.6287841796875, 1.797119140625, 1.9654541015625, 2.1337890625, 2.3021240234375, 2.470458984375, 2.6387939453125, 2.80712890625, 2.9754638671875, 3.143798828125, 3.3121337890625, 3.48046875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 8.0, 17.0, 74.0, 179.0, 351.0, 248.0, 79.0, 26.0, 8.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7177734375, -0.7013053894042969, -0.6848373413085938, -0.6683692932128906, -0.6519012451171875, -0.6354331970214844, -0.6189651489257812, -0.6024971008300781, -0.586029052734375, -0.5695610046386719, -0.5530929565429688, -0.5366249084472656, -0.5201568603515625, -0.5036888122558594, -0.48722076416015625, -0.4707527160644531, -0.45428466796875, -0.4378166198730469, -0.42134857177734375, -0.4048805236816406, -0.3884124755859375, -0.3719444274902344, -0.35547637939453125, -0.3390083312988281, -0.322540283203125, -0.3060722351074219, -0.28960418701171875, -0.2731361389160156, -0.2566680908203125, -0.24020004272460938, -0.22373199462890625, -0.20726394653320312, -0.1907958984375, -0.17432785034179688, -0.15785980224609375, -0.14139175415039062, -0.1249237060546875, -0.10845565795898438, -0.09198760986328125, -0.07551956176757812, -0.059051513671875, -0.042583465576171875, -0.02611541748046875, -0.009647369384765625, 0.0068206787109375, 0.023288726806640625, 0.03975677490234375, 0.056224822998046875, 0.07269287109375, 0.08916091918945312, 0.10562896728515625, 0.12209701538085938, 0.1385650634765625, 0.15503311157226562, 0.17150115966796875, 0.18796920776367188, 0.204437255859375, 0.22090530395507812, 0.23737335205078125, 0.2538414001464844, 0.2703094482421875, 0.2867774963378906, 0.30324554443359375, 0.3197135925292969, 0.336181640625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 0.0, 8.0, 10.0, 27.0, 50.0, 81.0, 177.0, 428.0, 1198.0, 4495.0, 49177.0, 4115217.0, 19232.0, 2854.0, 772.0, 264.0, 131.0, 61.0, 34.0, 27.0, 13.0, 14.0, 8.0, 4.0, 3.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9931640625, -0.965850830078125, -0.93853759765625, -0.911224365234375, -0.8839111328125, -0.856597900390625, -0.82928466796875, -0.801971435546875, -0.774658203125, -0.747344970703125, -0.72003173828125, -0.692718505859375, -0.6654052734375, -0.638092041015625, -0.61077880859375, -0.583465576171875, -0.55615234375, -0.528839111328125, -0.50152587890625, -0.474212646484375, -0.4468994140625, -0.419586181640625, -0.39227294921875, -0.364959716796875, -0.337646484375, -0.310333251953125, -0.28302001953125, -0.255706787109375, -0.2283935546875, -0.201080322265625, -0.17376708984375, -0.146453857421875, -0.119140625, -0.091827392578125, -0.06451416015625, -0.037200927734375, -0.0098876953125, 0.017425537109375, 0.04473876953125, 0.072052001953125, 0.099365234375, 0.126678466796875, 0.15399169921875, 0.181304931640625, 0.2086181640625, 0.235931396484375, 0.26324462890625, 0.290557861328125, 0.31787109375, 0.345184326171875, 0.37249755859375, 0.399810791015625, 0.4271240234375, 0.454437255859375, 0.48175048828125, 0.509063720703125, 0.536376953125, 0.563690185546875, 0.59100341796875, 0.618316650390625, 0.6456298828125, 0.672943115234375, 0.70025634765625, 0.727569580078125, 0.7548828125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 11.0, 7.0, 10.0, 18.0, 45.0, 106.0, 1009.0, 2657.0, 115.0, 35.0, 23.0, 16.0, 3.0, 4.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1885986328125, -0.18136024475097656, -0.17412185668945312, -0.1668834686279297, -0.15964508056640625, -0.1524066925048828, -0.14516830444335938, -0.13792991638183594, -0.1306915283203125, -0.12345314025878906, -0.11621475219726562, -0.10897636413574219, -0.10173797607421875, -0.09449958801269531, -0.08726119995117188, -0.08002281188964844, -0.072784423828125, -0.06554603576660156, -0.058307647705078125, -0.05106925964355469, -0.04383087158203125, -0.03659248352050781, -0.029354095458984375, -0.022115707397460938, -0.0148773193359375, -0.0076389312744140625, -0.000400543212890625, 0.0068378448486328125, 0.01407623291015625, 0.021314620971679688, 0.028553009033203125, 0.03579139709472656, 0.04302978515625, 0.05026817321777344, 0.057506561279296875, 0.06474494934082031, 0.07198333740234375, 0.07922172546386719, 0.08646011352539062, 0.09369850158691406, 0.1009368896484375, 0.10817527770996094, 0.11541366577148438, 0.12265205383300781, 0.12989044189453125, 0.1371288299560547, 0.14436721801757812, 0.15160560607910156, 0.158843994140625, 0.16608238220214844, 0.17332077026367188, 0.1805591583251953, 0.18779754638671875, 0.1950359344482422, 0.20227432250976562, 0.20951271057128906, 0.2167510986328125, 0.22398948669433594, 0.23122787475585938, 0.2384662628173828, 0.24570465087890625, 0.2529430389404297, 0.2601814270019531, 0.26741981506347656, 0.274658203125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 165.0, 847.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3448017835617065, -1.1571334600448608, -0.9694650173187256, -0.7817966938018799, -0.5941283106803894, -0.4064599275588989, -0.21879160404205322, -0.03112316131591797, 0.15654516220092773, 0.3442135453224182, 0.5318819284439087, 0.7195502519607544, 0.9072186350822449, 1.0948870182037354, 1.282555341720581, 1.4702237844467163, 1.657892107963562, 1.8455604314804077, 2.033228874206543, 2.2208971977233887, 2.4085655212402344, 2.59623384475708, 2.783902168273926, 2.9715707302093506, 3.1592390537261963, 3.346907377243042, 3.5345757007598877, 3.7222442626953125, 3.909912586212158, 4.097580909729004, 4.28524923324585, 4.472917556762695, 4.660585880279541, 4.848254203796387, 5.035922527313232, 5.223590850830078, 5.411259174346924, 5.5989274978637695, 5.786596298217773, 5.974264621734619, 6.161932945251465, 6.3496012687683105, 6.537269592285156, 6.724937915802002, 6.912606239318848, 7.100275039672852, 7.287942886352539, 7.475611686706543, 7.6632795333862305, 7.850947856903076, 8.038616180419922, 8.226284980773926, 8.413952827453613, 8.601621627807617, 8.789289474487305, 8.976958274841309, 9.164627075195312, 9.352295875549316, 9.539963722229004, 9.727632522583008, 9.915300369262695, 10.1029691696167, 10.290637016296387, 10.47830581665039, 10.665973663330078]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 7.0, 5.0, 7.0, 10.0, 16.0, 18.0, 23.0, 30.0, 37.0, 35.0, 50.0, 61.0, 43.0, 51.0, 74.0, 68.0, 65.0, 71.0, 54.0, 43.0, 50.0, 38.0, 31.0, 19.0, 15.0, 20.0, 21.0, 13.0, 6.0, 7.0, 7.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47241783142089844, -0.4569101929664612, -0.4414025545120239, -0.42589494585990906, -0.4103873074054718, -0.39487966895103455, -0.3793720602989197, -0.3638644218444824, -0.34835678339004517, -0.3328491449356079, -0.31734150648117065, -0.3018338978290558, -0.28632625937461853, -0.2708186209201813, -0.2553110122680664, -0.23980337381362915, -0.2242957353591919, -0.20878809690475464, -0.19328047335147858, -0.17777284979820251, -0.16226521134376526, -0.146757572889328, -0.13124994933605194, -0.11574231833219528, -0.10023468732833862, -0.08472705632448196, -0.0692194253206253, -0.053711794316768646, -0.03820416331291199, -0.02269653230905533, -0.007188901305198669, 0.00831872969865799, 0.02382636070251465, 0.03933399170637131, 0.054841622710227966, 0.07034925371408463, 0.08585688471794128, 0.10136451572179794, 0.1168721467256546, 0.13237977027893066, 0.14788740873336792, 0.16339504718780518, 0.17890267074108124, 0.1944102942943573, 0.20991793274879456, 0.2254255712032318, 0.24093319475650787, 0.25644081830978394, 0.2719484567642212, 0.28745609521865845, 0.3029637336730957, 0.31847134232521057, 0.3339789807796478, 0.3494866192340851, 0.36499422788619995, 0.3805018663406372, 0.39600950479507446, 0.4115171432495117, 0.427024781703949, 0.44253239035606384, 0.4580400288105011, 0.47354766726493835, 0.4890552759170532, 0.5045629143714905, 0.5200705528259277]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 0.0, 4.0, 3.0, 8.0, 3.0, 3.0, 11.0, 9.0, 7.0, 10.0, 22.0, 27.0, 29.0, 32.0, 56.0, 88.0, 136.0, 183.0, 380.0, 615.0, 1332.0, 3474.0, 24567.0, 927429.0, 80722.0, 5634.0, 1781.0, 823.0, 406.0, 264.0, 165.0, 96.0, 56.0, 48.0, 34.0, 24.0, 14.0, 11.0, 13.0, 8.0, 6.0, 9.0, 5.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3466796875, -1.3041534423828125, -1.261627197265625, -1.2191009521484375, -1.17657470703125, -1.1340484619140625, -1.091522216796875, -1.0489959716796875, -1.0064697265625, -0.9639434814453125, -0.921417236328125, -0.8788909912109375, -0.83636474609375, -0.7938385009765625, -0.751312255859375, -0.7087860107421875, -0.666259765625, -0.6237335205078125, -0.581207275390625, -0.5386810302734375, -0.49615478515625, -0.4536285400390625, -0.411102294921875, -0.3685760498046875, -0.3260498046875, -0.2835235595703125, -0.240997314453125, -0.1984710693359375, -0.15594482421875, -0.1134185791015625, -0.070892333984375, -0.0283660888671875, 0.01416015625, 0.0566864013671875, 0.099212646484375, 0.1417388916015625, 0.18426513671875, 0.2267913818359375, 0.269317626953125, 0.3118438720703125, 0.3543701171875, 0.3968963623046875, 0.439422607421875, 0.4819488525390625, 0.52447509765625, 0.5670013427734375, 0.609527587890625, 0.6520538330078125, 0.694580078125, 0.7371063232421875, 0.779632568359375, 0.8221588134765625, 0.86468505859375, 0.9072113037109375, 0.949737548828125, 0.9922637939453125, 1.0347900390625, 1.0773162841796875, 1.119842529296875, 1.1623687744140625, 1.20489501953125, 1.2474212646484375, 1.289947509765625, 1.3324737548828125, 1.375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 8.0, 22.0, 79.0, 217.0, 346.0, 221.0, 69.0, 22.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70947265625, -0.693145751953125, -0.67681884765625, -0.660491943359375, -0.6441650390625, -0.627838134765625, -0.61151123046875, -0.595184326171875, -0.578857421875, -0.562530517578125, -0.54620361328125, -0.529876708984375, -0.5135498046875, -0.497222900390625, -0.48089599609375, -0.464569091796875, -0.4482421875, -0.431915283203125, -0.41558837890625, -0.399261474609375, -0.3829345703125, -0.366607666015625, -0.35028076171875, -0.333953857421875, -0.317626953125, -0.301300048828125, -0.28497314453125, -0.268646240234375, -0.2523193359375, -0.235992431640625, -0.21966552734375, -0.203338623046875, -0.18701171875, -0.170684814453125, -0.15435791015625, -0.138031005859375, -0.1217041015625, -0.105377197265625, -0.08905029296875, -0.072723388671875, -0.056396484375, -0.040069580078125, -0.02374267578125, -0.007415771484375, 0.0089111328125, 0.025238037109375, 0.04156494140625, 0.057891845703125, 0.07421875, 0.090545654296875, 0.10687255859375, 0.123199462890625, 0.1395263671875, 0.155853271484375, 0.17218017578125, 0.188507080078125, 0.204833984375, 0.221160888671875, 0.23748779296875, 0.253814697265625, 0.2701416015625, 0.286468505859375, 0.30279541015625, 0.319122314453125, 0.33544921875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 7.0, 5.0, 10.0, 9.0, 8.0, 8.0, 13.0, 20.0, 22.0, 20.0, 27.0, 46.0, 67.0, 117.0, 179.0, 347.0, 915.0, 3391.0, 19494.0, 259359.0, 716084.0, 40300.0, 5624.0, 1375.0, 443.0, 230.0, 132.0, 85.0, 53.0, 34.0, 24.0, 19.0, 12.0, 13.0, 11.0, 6.0, 8.0, 8.0, 5.0, 7.0, 4.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.00390625, -0.9706268310546875, -0.937347412109375, -0.9040679931640625, -0.87078857421875, -0.8375091552734375, -0.804229736328125, -0.7709503173828125, -0.7376708984375, -0.7043914794921875, -0.671112060546875, -0.6378326416015625, -0.60455322265625, -0.5712738037109375, -0.537994384765625, -0.5047149658203125, -0.471435546875, -0.4381561279296875, -0.404876708984375, -0.3715972900390625, -0.33831787109375, -0.3050384521484375, -0.271759033203125, -0.2384796142578125, -0.2052001953125, -0.1719207763671875, -0.138641357421875, -0.1053619384765625, -0.07208251953125, -0.0388031005859375, -0.005523681640625, 0.0277557373046875, 0.06103515625, 0.0943145751953125, 0.127593994140625, 0.1608734130859375, 0.19415283203125, 0.2274322509765625, 0.260711669921875, 0.2939910888671875, 0.3272705078125, 0.3605499267578125, 0.393829345703125, 0.4271087646484375, 0.46038818359375, 0.4936676025390625, 0.526947021484375, 0.5602264404296875, 0.593505859375, 0.6267852783203125, 0.660064697265625, 0.6933441162109375, 0.72662353515625, 0.7599029541015625, 0.793182373046875, 0.8264617919921875, 0.8597412109375, 0.8930206298828125, 0.926300048828125, 0.9595794677734375, 0.99285888671875, 1.0261383056640625, 1.059417724609375, 1.0926971435546875, 1.1259765625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 2.0, 6.0, 6.0, 6.0, 7.0, 9.0, 7.0, 10.0, 14.0, 12.0, 16.0, 19.0, 24.0, 33.0, 27.0, 37.0, 48.0, 51.0, 45.0, 49.0, 36.0, 42.0, 41.0, 49.0, 53.0, 47.0, 40.0, 44.0, 35.0, 23.0, 29.0, 19.0, 17.0, 17.0, 22.0, 6.0, 8.0, 9.0, 13.0, 5.0, 2.0, 11.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.63134765625, -0.6125640869140625, -0.593780517578125, -0.5749969482421875, -0.55621337890625, -0.5374298095703125, -0.518646240234375, -0.4998626708984375, -0.4810791015625, -0.4622955322265625, -0.443511962890625, -0.4247283935546875, -0.40594482421875, -0.3871612548828125, -0.368377685546875, -0.3495941162109375, -0.330810546875, -0.3120269775390625, -0.293243408203125, -0.2744598388671875, -0.25567626953125, -0.2368927001953125, -0.218109130859375, -0.1993255615234375, -0.1805419921875, -0.1617584228515625, -0.142974853515625, -0.1241912841796875, -0.10540771484375, -0.0866241455078125, -0.067840576171875, -0.0490570068359375, -0.0302734375, -0.0114898681640625, 0.007293701171875, 0.0260772705078125, 0.04486083984375, 0.0636444091796875, 0.082427978515625, 0.1012115478515625, 0.1199951171875, 0.1387786865234375, 0.157562255859375, 0.1763458251953125, 0.19512939453125, 0.2139129638671875, 0.232696533203125, 0.2514801025390625, 0.270263671875, 0.2890472412109375, 0.307830810546875, 0.3266143798828125, 0.34539794921875, 0.3641815185546875, 0.382965087890625, 0.4017486572265625, 0.4205322265625, 0.4393157958984375, 0.458099365234375, 0.4768829345703125, 0.49566650390625, 0.5144500732421875, 0.533233642578125, 0.5520172119140625, 0.57080078125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 2.0, 3.0, 3.0, 7.0, 12.0, 20.0, 41.0, 63.0, 111.0, 208.0, 443.0, 1179.0, 4575.0, 32712.0, 738718.0, 251722.0, 14512.0, 2664.0, 848.0, 335.0, 162.0, 74.0, 39.0, 31.0, 22.0, 16.0, 12.0, 12.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1451416015625, -0.1399250030517578, -0.13470840454101562, -0.12949180603027344, -0.12427520751953125, -0.11905860900878906, -0.11384201049804688, -0.10862541198730469, -0.1034088134765625, -0.09819221496582031, -0.09297561645507812, -0.08775901794433594, -0.08254241943359375, -0.07732582092285156, -0.07210922241210938, -0.06689262390136719, -0.061676025390625, -0.05645942687988281, -0.051242828369140625, -0.04602622985839844, -0.04080963134765625, -0.03559303283691406, -0.030376434326171875, -0.025159835815429688, -0.0199432373046875, -0.014726638793945312, -0.009510040283203125, -0.0042934417724609375, 0.00092315673828125, 0.0061397552490234375, 0.011356353759765625, 0.016572952270507812, 0.02178955078125, 0.027006149291992188, 0.032222747802734375, 0.03743934631347656, 0.04265594482421875, 0.04787254333496094, 0.053089141845703125, 0.05830574035644531, 0.0635223388671875, 0.06873893737792969, 0.07395553588867188, 0.07917213439941406, 0.08438873291015625, 0.08960533142089844, 0.09482192993164062, 0.10003852844238281, 0.105255126953125, 0.11047172546386719, 0.11568832397460938, 0.12090492248535156, 0.12612152099609375, 0.13133811950683594, 0.13655471801757812, 0.1417713165283203, 0.1469879150390625, 0.1522045135498047, 0.15742111206054688, 0.16263771057128906, 0.16785430908203125, 0.17307090759277344, 0.17828750610351562, 0.1835041046142578, 0.188720703125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 4.0, 7.0, 8.0, 10.0, 11.0, 13.0, 12.0, 24.0, 28.0, 31.0, 40.0, 47.0, 38.0, 76.0, 92.0, 79.0, 59.0, 76.0, 69.0, 64.0, 44.0, 42.0, 22.0, 13.0, 21.0, 19.0, 16.0, 8.0, 6.0, 6.0, 1.0, 7.0, 4.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.417533874511719e-06, -9.120441973209381e-06, -8.823350071907043e-06, -8.526258170604706e-06, -8.229166269302368e-06, -7.93207436800003e-06, -7.634982466697693e-06, -7.337890565395355e-06, -7.040798664093018e-06, -6.74370676279068e-06, -6.446614861488342e-06, -6.149522960186005e-06, -5.852431058883667e-06, -5.555339157581329e-06, -5.258247256278992e-06, -4.961155354976654e-06, -4.664063453674316e-06, -4.366971552371979e-06, -4.069879651069641e-06, -3.7727877497673035e-06, -3.475695848464966e-06, -3.178603947162628e-06, -2.8815120458602905e-06, -2.584420144557953e-06, -2.2873282432556152e-06, -1.9902363419532776e-06, -1.69314444065094e-06, -1.3960525393486023e-06, -1.0989606380462646e-06, -8.01868736743927e-07, -5.047768354415894e-07, -2.076849341392517e-07, 8.940696716308594e-08, 3.864988684654236e-07, 6.835907697677612e-07, 9.806826710700989e-07, 1.2777745723724365e-06, 1.5748664736747742e-06, 1.8719583749771118e-06, 2.1690502762794495e-06, 2.466142177581787e-06, 2.7632340788841248e-06, 3.0603259801864624e-06, 3.3574178814888e-06, 3.6545097827911377e-06, 3.951601684093475e-06, 4.248693585395813e-06, 4.545785486698151e-06, 4.842877388000488e-06, 5.139969289302826e-06, 5.4370611906051636e-06, 5.734153091907501e-06, 6.031244993209839e-06, 6.3283368945121765e-06, 6.625428795814514e-06, 6.922520697116852e-06, 7.2196125984191895e-06, 7.516704499721527e-06, 7.813796401023865e-06, 8.110888302326202e-06, 8.40798020362854e-06, 8.705072104930878e-06, 9.002164006233215e-06, 9.299255907535553e-06, 9.59634780883789e-06]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 4.0, 7.0, 10.0, 9.0, 13.0, 19.0, 24.0, 45.0, 52.0, 105.0, 212.0, 568.0, 1994.0, 12251.0, 391001.0, 623049.0, 15754.0, 2279.0, 629.0, 231.0, 98.0, 62.0, 42.0, 22.0, 24.0, 14.0, 17.0, 9.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2203369140625, -0.21300506591796875, -0.2056732177734375, -0.19834136962890625, -0.191009521484375, -0.18367767333984375, -0.1763458251953125, -0.16901397705078125, -0.16168212890625, -0.15435028076171875, -0.1470184326171875, -0.13968658447265625, -0.132354736328125, -0.12502288818359375, -0.1176910400390625, -0.11035919189453125, -0.10302734375, -0.09569549560546875, -0.0883636474609375, -0.08103179931640625, -0.073699951171875, -0.06636810302734375, -0.0590362548828125, -0.05170440673828125, -0.04437255859375, -0.03704071044921875, -0.0297088623046875, -0.02237701416015625, -0.015045166015625, -0.00771331787109375, -0.0003814697265625, 0.00695037841796875, 0.0142822265625, 0.02161407470703125, 0.0289459228515625, 0.03627777099609375, 0.043609619140625, 0.05094146728515625, 0.0582733154296875, 0.06560516357421875, 0.07293701171875, 0.08026885986328125, 0.0876007080078125, 0.09493255615234375, 0.102264404296875, 0.10959625244140625, 0.1169281005859375, 0.12425994873046875, 0.131591796875, 0.13892364501953125, 0.1462554931640625, 0.15358734130859375, 0.160919189453125, 0.16825103759765625, 0.1755828857421875, 0.18291473388671875, 0.19024658203125, 0.19757843017578125, 0.2049102783203125, 0.21224212646484375, 0.219573974609375, 0.22690582275390625, 0.2342376708984375, 0.24156951904296875, 0.2489013671875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 5.0, 1.0, 5.0, 5.0, 14.0, 16.0, 12.0, 24.0, 24.0, 31.0, 41.0, 56.0, 65.0, 85.0, 89.0, 109.0, 94.0, 67.0, 59.0, 41.0, 38.0, 29.0, 18.0, 19.0, 16.0, 9.0, 7.0, 4.0, 8.0, 5.0, 3.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.134033203125, -0.1301097869873047, -0.12618637084960938, -0.12226295471191406, -0.11833953857421875, -0.11441612243652344, -0.11049270629882812, -0.10656929016113281, -0.1026458740234375, -0.09872245788574219, -0.09479904174804688, -0.09087562561035156, -0.08695220947265625, -0.08302879333496094, -0.07910537719726562, -0.07518196105957031, -0.071258544921875, -0.06733512878417969, -0.06341171264648438, -0.05948829650878906, -0.05556488037109375, -0.05164146423339844, -0.047718048095703125, -0.04379463195800781, -0.0398712158203125, -0.03594779968261719, -0.032024383544921875, -0.028100967407226562, -0.02417755126953125, -0.020254135131835938, -0.016330718994140625, -0.012407302856445312, -0.00848388671875, -0.0045604705810546875, -0.000637054443359375, 0.0032863616943359375, 0.00720977783203125, 0.011133193969726562, 0.015056610107421875, 0.018980026245117188, 0.0229034423828125, 0.026826858520507812, 0.030750274658203125, 0.03467369079589844, 0.03859710693359375, 0.04252052307128906, 0.046443939208984375, 0.05036735534667969, 0.054290771484375, 0.05821418762207031, 0.062137603759765625, 0.06606101989746094, 0.06998443603515625, 0.07390785217285156, 0.07783126831054688, 0.08175468444824219, 0.0856781005859375, 0.08960151672363281, 0.09352493286132812, 0.09744834899902344, 0.10137176513671875, 0.10529518127441406, 0.10921859741210938, 0.11314201354980469, 0.1170654296875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 6.0, 3.0, 14.0, 13.0, 24.0, 38.0, 79.0, 178.0, 280.0, 182.0, 75.0, 38.0, 34.0, 19.0, 8.0, 7.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.151472091674805, -5.03578519821167, -4.920098304748535, -4.8044114112854, -4.688724517822266, -4.573037624359131, -4.457350730895996, -4.341663837432861, -4.225976943969727, -4.110290050506592, -3.994603157043457, -3.8789162635803223, -3.7632293701171875, -3.6475424766540527, -3.531855583190918, -3.416168689727783, -3.3004820346832275, -3.1847951412200928, -3.069108247756958, -2.9534213542938232, -2.8377344608306885, -2.7220475673675537, -2.606360912322998, -2.4906740188598633, -2.3749871253967285, -2.2593002319335938, -2.143613338470459, -2.027926445007324, -1.9122395515441895, -1.7965526580810547, -1.6808658838272095, -1.5651789903640747, -1.4494922161102295, -1.3338053226470947, -1.21811842918396, -1.1024315357208252, -0.9867447018623352, -0.8710578083992004, -0.7553709745407104, -0.6396840810775757, -0.5239971876144409, -0.40831029415130615, -0.2926234304904938, -0.1769365668296814, -0.06124967336654663, 0.054437220096588135, 0.17012405395507812, 0.2858109474182129, 0.40149784088134766, 0.5171847343444824, 0.6328716278076172, 0.7485584616661072, 0.8642453551292419, 0.9799322485923767, 1.0956190824508667, 1.2113059759140015, 1.3269928693771362, 1.442679762840271, 1.5583666563034058, 1.674053430557251, 1.7897403240203857, 1.9054272174835205, 2.0211141109466553, 2.13680100440979, 2.252487897872925]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 6.0, 1.0, 5.0, 6.0, 8.0, 10.0, 8.0, 17.0, 21.0, 13.0, 24.0, 40.0, 37.0, 30.0, 44.0, 48.0, 56.0, 49.0, 55.0, 47.0, 43.0, 50.0, 57.0, 60.0, 50.0, 32.0, 25.0, 32.0, 33.0, 19.0, 17.0, 14.0, 15.0, 3.0, 7.0, 7.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.053379058837891, -3.934798002243042, -3.8162171840667725, -3.697636127471924, -3.5790553092956543, -3.4604742527008057, -3.341893196105957, -3.2233123779296875, -3.104731321334839, -2.9861502647399902, -2.8675694465637207, -2.748988389968872, -2.6304073333740234, -2.511826515197754, -2.3932454586029053, -2.2746644020080566, -2.156083583831787, -2.0375025272369385, -1.918921709060669, -1.8003406524658203, -1.6817597150802612, -1.5631787776947021, -1.4445977210998535, -1.3260167837142944, -1.2074358463287354, -1.0888549089431763, -0.9702739119529724, -0.8516929149627686, -0.7331119775772095, -0.6145310401916504, -0.49595004320144653, -0.3773690462112427, -0.2587881088256836, -0.14020714163780212, -0.021626174449920654, 0.09695479273796082, 0.21553575992584229, 0.33411669731140137, 0.4526976943016052, 0.5712786912918091, 0.6898596286773682, 0.8084405660629272, 0.9270215630531311, 1.045602560043335, 1.164183497428894, 1.2827644348144531, 1.4013454914093018, 1.5199264287948608, 1.63850736618042, 1.757088303565979, 1.875669240951538, 1.9942502975463867, 2.1128311157226562, 2.231412172317505, 2.3499932289123535, 2.468574047088623, 2.5871551036834717, 2.7057361602783203, 2.82431697845459, 2.9428980350494385, 3.061479091644287, 3.1800599098205566, 3.2986409664154053, 3.417222023010254, 3.5358028411865234]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 6.0, 12.0, 17.0, 18.0, 20.0, 42.0, 84.0, 145.0, 288.0, 1039.0, 8329.0, 4170192.0, 12353.0, 1152.0, 320.0, 112.0, 55.0, 40.0, 18.0, 13.0, 5.0, 4.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.01171875, -2.94256591796875, -2.8734130859375, -2.80426025390625, -2.735107421875, -2.66595458984375, -2.5968017578125, -2.52764892578125, -2.45849609375, -2.38934326171875, -2.3201904296875, -2.25103759765625, -2.181884765625, -2.11273193359375, -2.0435791015625, -1.97442626953125, -1.9052734375, -1.83612060546875, -1.7669677734375, -1.69781494140625, -1.628662109375, -1.55950927734375, -1.4903564453125, -1.42120361328125, -1.35205078125, -1.28289794921875, -1.2137451171875, -1.14459228515625, -1.075439453125, -1.00628662109375, -0.9371337890625, -0.86798095703125, -0.798828125, -0.72967529296875, -0.6605224609375, -0.59136962890625, -0.522216796875, -0.45306396484375, -0.3839111328125, -0.31475830078125, -0.24560546875, -0.17645263671875, -0.1072998046875, -0.03814697265625, 0.031005859375, 0.10015869140625, 0.1693115234375, 0.23846435546875, 0.3076171875, 0.37677001953125, 0.4459228515625, 0.51507568359375, 0.584228515625, 0.65338134765625, 0.7225341796875, 0.79168701171875, 0.86083984375, 0.92999267578125, 0.9991455078125, 1.06829833984375, 1.137451171875, 1.20660400390625, 1.2757568359375, 1.34490966796875, 1.4140625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 9.0, 21.0, 75.0, 193.0, 306.0, 261.0, 79.0, 35.0, 8.0, 5.0, 6.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7294921875, -0.7127761840820312, -0.6960601806640625, -0.6793441772460938, -0.662628173828125, -0.6459121704101562, -0.6291961669921875, -0.6124801635742188, -0.59576416015625, -0.5790481567382812, -0.5623321533203125, -0.5456161499023438, -0.528900146484375, -0.5121841430664062, -0.4954681396484375, -0.47875213623046875, -0.4620361328125, -0.44532012939453125, -0.4286041259765625, -0.41188812255859375, -0.395172119140625, -0.37845611572265625, -0.3617401123046875, -0.34502410888671875, -0.32830810546875, -0.31159210205078125, -0.2948760986328125, -0.27816009521484375, -0.261444091796875, -0.24472808837890625, -0.2280120849609375, -0.21129608154296875, -0.194580078125, -0.17786407470703125, -0.1611480712890625, -0.14443206787109375, -0.127716064453125, -0.11100006103515625, -0.0942840576171875, -0.07756805419921875, -0.06085205078125, -0.04413604736328125, -0.0274200439453125, -0.01070404052734375, 0.006011962890625, 0.02272796630859375, 0.0394439697265625, 0.05615997314453125, 0.0728759765625, 0.08959197998046875, 0.1063079833984375, 0.12302398681640625, 0.139739990234375, 0.15645599365234375, 0.1731719970703125, 0.18988800048828125, 0.20660400390625, 0.22332000732421875, 0.2400360107421875, 0.25675201416015625, 0.273468017578125, 0.29018402099609375, 0.3069000244140625, 0.32361602783203125, 0.34033203125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 9.0, 2.0, 5.0, 7.0, 23.0, 45.0, 89.0, 302.0, 1170.0, 6840.0, 4122682.0, 59438.0, 2796.0, 513.0, 167.0, 93.0, 43.0, 22.0, 22.0, 8.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.634765625, -2.570159912109375, -2.50555419921875, -2.440948486328125, -2.3763427734375, -2.311737060546875, -2.24713134765625, -2.182525634765625, -2.117919921875, -2.053314208984375, -1.98870849609375, -1.924102783203125, -1.8594970703125, -1.794891357421875, -1.73028564453125, -1.665679931640625, -1.60107421875, -1.536468505859375, -1.47186279296875, -1.407257080078125, -1.3426513671875, -1.278045654296875, -1.21343994140625, -1.148834228515625, -1.084228515625, -1.019622802734375, -0.95501708984375, -0.890411376953125, -0.8258056640625, -0.761199951171875, -0.69659423828125, -0.631988525390625, -0.5673828125, -0.502777099609375, -0.43817138671875, -0.373565673828125, -0.3089599609375, -0.244354248046875, -0.17974853515625, -0.115142822265625, -0.050537109375, 0.014068603515625, 0.07867431640625, 0.143280029296875, 0.2078857421875, 0.272491455078125, 0.33709716796875, 0.401702880859375, 0.46630859375, 0.530914306640625, 0.59552001953125, 0.660125732421875, 0.7247314453125, 0.789337158203125, 0.85394287109375, 0.918548583984375, 0.983154296875, 1.047760009765625, 1.11236572265625, 1.176971435546875, 1.2415771484375, 1.306182861328125, 1.37078857421875, 1.435394287109375, 1.5]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 10.0, 17.0, 29.0, 91.0, 271.0, 3305.0, 228.0, 53.0, 29.0, 11.0, 9.0, 7.0, 2.0, 1.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.466552734375, -0.4466972351074219, -0.42684173583984375, -0.4069862365722656, -0.3871307373046875, -0.3672752380371094, -0.34741973876953125, -0.3275642395019531, -0.307708740234375, -0.2878532409667969, -0.26799774169921875, -0.24814224243164062, -0.2282867431640625, -0.20843124389648438, -0.18857574462890625, -0.16872024536132812, -0.14886474609375, -0.12900924682617188, -0.10915374755859375, -0.08929824829101562, -0.0694427490234375, -0.049587249755859375, -0.02973175048828125, -0.009876251220703125, 0.009979248046875, 0.029834747314453125, 0.04969024658203125, 0.06954574584960938, 0.0894012451171875, 0.10925674438476562, 0.12911224365234375, 0.14896774291992188, 0.1688232421875, 0.18867874145507812, 0.20853424072265625, 0.22838973999023438, 0.2482452392578125, 0.2681007385253906, 0.28795623779296875, 0.3078117370605469, 0.327667236328125, 0.3475227355957031, 0.36737823486328125, 0.3872337341308594, 0.4070892333984375, 0.4269447326660156, 0.44680023193359375, 0.4666557312011719, 0.48651123046875, 0.5063667297363281, 0.5262222290039062, 0.5460777282714844, 0.5659332275390625, 0.5857887268066406, 0.6056442260742188, 0.6254997253417969, 0.645355224609375, 0.6652107238769531, 0.6850662231445312, 0.7049217224121094, 0.7247772216796875, 0.7446327209472656, 0.7644882202148438, 0.7843437194824219, 0.80419921875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 2.0, 6.0, 10.0, 50.0, 431.0, 431.0, 50.0, 18.0, 8.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.220455169677734, -4.1127448081970215, -4.005034446716309, -3.8973240852355957, -3.789613723754883, -3.68190336227417, -3.574192762374878, -3.466482400894165, -3.358772039413452, -3.2510616779327393, -3.1433513164520264, -3.0356409549713135, -2.9279303550720215, -2.8202199935913086, -2.7125096321105957, -2.604799270629883, -2.49708890914917, -2.389378547668457, -2.281668186187744, -2.1739578247070312, -2.0662474632263184, -1.958536982536316, -1.8508265018463135, -1.7431161403656006, -1.6354057788848877, -1.5276954174041748, -1.419985055923462, -1.3122745752334595, -1.2045642137527466, -1.0968538522720337, -0.989143431186676, -0.8814330101013184, -0.7737228870391846, -0.6660125255584717, -0.558302104473114, -0.45059171319007874, -0.34288132190704346, -0.23517096042633057, -0.1274605393409729, -0.019750118255615234, 0.08796024322509766, 0.19567063450813293, 0.3033810257911682, 0.4110914170742035, 0.5188018083572388, 0.6265121698379517, 0.7342225909233093, 0.841933012008667, 0.9496433734893799, 1.0573537349700928, 1.1650640964508057, 1.272774577140808, 1.380484938621521, 1.4881953001022339, 1.5959057807922363, 1.7036161422729492, 1.811326503753662, 1.919036865234375, 2.026747226715088, 2.134457588195801, 2.2421679496765137, 2.3498783111572266, 2.4575889110565186, 2.5652992725372314, 2.6730096340179443]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 3.0, 4.0, 26.0, 33.0, 64.0, 95.0, 107.0, 133.0, 119.0, 110.0, 116.0, 75.0, 57.0, 27.0, 19.0, 7.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8339438438415527, -2.7609875202178955, -2.6880311965942383, -2.615074634552002, -2.5421183109283447, -2.4691619873046875, -2.3962056636810303, -2.323249340057373, -2.2502927780151367, -2.1773364543914795, -2.1043801307678223, -2.031423568725586, -1.9584672451019287, -1.8855109214782715, -1.8125545978546143, -1.7395981550216675, -1.6666418313980103, -1.593685507774353, -1.5207290649414062, -1.447772741317749, -1.3748162984848022, -1.301859974861145, -1.2289035320281982, -1.155947208404541, -1.0829908847808838, -1.0100345611572266, -0.9370781183242798, -0.8641217947006226, -0.7911653518676758, -0.7182090282440186, -0.6452526450157166, -0.5722962617874146, -0.4993398189544678, -0.42638343572616577, -0.35342705249786377, -0.28047069907188416, -0.20751431584358215, -0.13455793261528015, -0.06160157918930054, 0.011354804039001465, 0.08431118726730347, 0.15726757049560547, 0.23022393882274628, 0.3031803071498871, 0.3761366903781891, 0.4490930736064911, 0.5220494270324707, 0.5950058102607727, 0.6679621934890747, 0.7409185767173767, 0.8138749599456787, 0.8868312835693359, 0.9597877264022827, 1.03274405002594, 1.1057004928588867, 1.178656816482544, 1.2516131401062012, 1.3245694637298584, 1.3975259065628052, 1.4704822301864624, 1.5434386730194092, 1.6163949966430664, 1.6893513202667236, 1.7623077630996704, 1.8352642059326172]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 7.0, 8.0, 7.0, 18.0, 10.0, 14.0, 29.0, 24.0, 46.0, 53.0, 107.0, 169.0, 284.0, 542.0, 1012.0, 2544.0, 12164.0, 764936.0, 254048.0, 8391.0, 2125.0, 874.0, 437.0, 264.0, 142.0, 93.0, 52.0, 41.0, 27.0, 24.0, 13.0, 11.0, 7.0, 9.0, 5.0, 2.0, 4.0, 5.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.107421875, -2.0452728271484375, -1.983123779296875, -1.9209747314453125, -1.85882568359375, -1.7966766357421875, -1.734527587890625, -1.6723785400390625, -1.6102294921875, -1.5480804443359375, -1.485931396484375, -1.4237823486328125, -1.36163330078125, -1.2994842529296875, -1.237335205078125, -1.1751861572265625, -1.113037109375, -1.0508880615234375, -0.988739013671875, -0.9265899658203125, -0.86444091796875, -0.8022918701171875, -0.740142822265625, -0.6779937744140625, -0.6158447265625, -0.5536956787109375, -0.491546630859375, -0.4293975830078125, -0.36724853515625, -0.3050994873046875, -0.242950439453125, -0.1808013916015625, -0.11865234375, -0.0565032958984375, 0.005645751953125, 0.0677947998046875, 0.12994384765625, 0.1920928955078125, 0.254241943359375, 0.3163909912109375, 0.3785400390625, 0.4406890869140625, 0.502838134765625, 0.5649871826171875, 0.62713623046875, 0.6892852783203125, 0.751434326171875, 0.8135833740234375, 0.875732421875, 0.9378814697265625, 1.000030517578125, 1.0621795654296875, 1.12432861328125, 1.1864776611328125, 1.248626708984375, 1.3107757568359375, 1.3729248046875, 1.4350738525390625, 1.497222900390625, 1.5593719482421875, 1.62152099609375, 1.6836700439453125, 1.745819091796875, 1.8079681396484375, 1.8701171875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 10.0, 45.0, 115.0, 242.0, 314.0, 175.0, 56.0, 21.0, 9.0, 2.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70263671875, -0.6863784790039062, -0.6701202392578125, -0.6538619995117188, -0.637603759765625, -0.6213455200195312, -0.6050872802734375, -0.5888290405273438, -0.57257080078125, -0.5563125610351562, -0.5400543212890625, -0.5237960815429688, -0.507537841796875, -0.49127960205078125, -0.4750213623046875, -0.45876312255859375, -0.4425048828125, -0.42624664306640625, -0.4099884033203125, -0.39373016357421875, -0.377471923828125, -0.36121368408203125, -0.3449554443359375, -0.32869720458984375, -0.31243896484375, -0.29618072509765625, -0.2799224853515625, -0.26366424560546875, -0.247406005859375, -0.23114776611328125, -0.2148895263671875, -0.19863128662109375, -0.182373046875, -0.16611480712890625, -0.1498565673828125, -0.13359832763671875, -0.117340087890625, -0.10108184814453125, -0.0848236083984375, -0.06856536865234375, -0.05230712890625, -0.03604888916015625, -0.0197906494140625, -0.00353240966796875, 0.012725830078125, 0.02898406982421875, 0.0452423095703125, 0.06150054931640625, 0.0777587890625, 0.09401702880859375, 0.1102752685546875, 0.12653350830078125, 0.142791748046875, 0.15904998779296875, 0.1753082275390625, 0.19156646728515625, 0.20782470703125, 0.22408294677734375, 0.2403411865234375, 0.25659942626953125, 0.272857666015625, 0.28911590576171875, 0.3053741455078125, 0.32163238525390625, 0.337890625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 3.0, 12.0, 5.0, 11.0, 5.0, 16.0, 14.0, 15.0, 19.0, 23.0, 23.0, 43.0, 73.0, 120.0, 277.0, 863.0, 3136.0, 18032.0, 167766.0, 775208.0, 70466.0, 9394.0, 1907.0, 539.0, 201.0, 103.0, 56.0, 39.0, 19.0, 30.0, 21.0, 19.0, 17.0, 23.0, 9.0, 12.0, 7.0, 5.0, 7.0, 3.0, 5.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-1.1904296875, -1.1567306518554688, -1.1230316162109375, -1.0893325805664062, -1.055633544921875, -1.0219345092773438, -0.9882354736328125, -0.9545364379882812, -0.92083740234375, -0.8871383666992188, -0.8534393310546875, -0.8197402954101562, -0.786041259765625, -0.7523422241210938, -0.7186431884765625, -0.6849441528320312, -0.6512451171875, -0.6175460815429688, -0.5838470458984375, -0.5501480102539062, -0.516448974609375, -0.48274993896484375, -0.4490509033203125, -0.41535186767578125, -0.38165283203125, -0.34795379638671875, -0.3142547607421875, -0.28055572509765625, -0.246856689453125, -0.21315765380859375, -0.1794586181640625, -0.14575958251953125, -0.112060546875, -0.07836151123046875, -0.0446624755859375, -0.01096343994140625, 0.022735595703125, 0.05643463134765625, 0.0901336669921875, 0.12383270263671875, 0.15753173828125, 0.19123077392578125, 0.2249298095703125, 0.25862884521484375, 0.292327880859375, 0.32602691650390625, 0.3597259521484375, 0.39342498779296875, 0.4271240234375, 0.46082305908203125, 0.4945220947265625, 0.5282211303710938, 0.561920166015625, 0.5956192016601562, 0.6293182373046875, 0.6630172729492188, 0.69671630859375, 0.7304153442382812, 0.7641143798828125, 0.7978134155273438, 0.831512451171875, 0.8652114868164062, 0.8989105224609375, 0.9326095581054688, 0.96630859375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 3.0, 4.0, 8.0, 6.0, 8.0, 10.0, 13.0, 20.0, 15.0, 21.0, 28.0, 26.0, 15.0, 31.0, 37.0, 41.0, 35.0, 44.0, 37.0, 38.0, 45.0, 40.0, 56.0, 53.0, 44.0, 47.0, 37.0, 36.0, 37.0, 26.0, 22.0, 15.0, 22.0, 11.0, 17.0, 13.0, 7.0, 10.0, 7.0, 6.0, 6.0, 2.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.54296875, -0.5238113403320312, -0.5046539306640625, -0.48549652099609375, -0.466339111328125, -0.44718170166015625, -0.4280242919921875, -0.40886688232421875, -0.38970947265625, -0.37055206298828125, -0.3513946533203125, -0.33223724365234375, -0.313079833984375, -0.29392242431640625, -0.2747650146484375, -0.25560760498046875, -0.2364501953125, -0.21729278564453125, -0.1981353759765625, -0.17897796630859375, -0.159820556640625, -0.14066314697265625, -0.1215057373046875, -0.10234832763671875, -0.08319091796875, -0.06403350830078125, -0.0448760986328125, -0.02571868896484375, -0.006561279296875, 0.01259613037109375, 0.0317535400390625, 0.05091094970703125, 0.070068359375, 0.08922576904296875, 0.1083831787109375, 0.12754058837890625, 0.146697998046875, 0.16585540771484375, 0.1850128173828125, 0.20417022705078125, 0.22332763671875, 0.24248504638671875, 0.2616424560546875, 0.28079986572265625, 0.299957275390625, 0.31911468505859375, 0.3382720947265625, 0.35742950439453125, 0.3765869140625, 0.39574432373046875, 0.4149017333984375, 0.43405914306640625, 0.453216552734375, 0.47237396240234375, 0.4915313720703125, 0.5106887817382812, 0.52984619140625, 0.5490036010742188, 0.5681610107421875, 0.5873184204101562, 0.606475830078125, 0.6256332397460938, 0.6447906494140625, 0.6639480590820312, 0.68310546875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 8.0, 8.0, 15.0, 19.0, 23.0, 53.0, 70.0, 122.0, 285.0, 551.0, 1077.0, 2355.0, 6812.0, 30985.0, 669660.0, 307677.0, 19897.0, 5109.0, 1984.0, 870.0, 386.0, 225.0, 104.0, 76.0, 50.0, 36.0, 23.0, 26.0, 8.0, 7.0, 5.0, 6.0, 2.0, 4.0, 6.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.250244140625, -0.24158096313476562, -0.23291778564453125, -0.22425460815429688, -0.2155914306640625, -0.20692825317382812, -0.19826507568359375, -0.18960189819335938, -0.180938720703125, -0.17227554321289062, -0.16361236572265625, -0.15494918823242188, -0.1462860107421875, -0.13762283325195312, -0.12895965576171875, -0.12029647827148438, -0.11163330078125, -0.10297012329101562, -0.09430694580078125, -0.08564376831054688, -0.0769805908203125, -0.06831741333007812, -0.05965423583984375, -0.050991058349609375, -0.042327880859375, -0.033664703369140625, -0.02500152587890625, -0.016338348388671875, -0.0076751708984375, 0.000988006591796875, 0.00965118408203125, 0.018314361572265625, 0.0269775390625, 0.035640716552734375, 0.04430389404296875, 0.052967071533203125, 0.0616302490234375, 0.07029342651367188, 0.07895660400390625, 0.08761978149414062, 0.096282958984375, 0.10494613647460938, 0.11360931396484375, 0.12227249145507812, 0.1309356689453125, 0.13959884643554688, 0.14826202392578125, 0.15692520141601562, 0.16558837890625, 0.17425155639648438, 0.18291473388671875, 0.19157791137695312, 0.2002410888671875, 0.20890426635742188, 0.21756744384765625, 0.22623062133789062, 0.234893798828125, 0.24355697631835938, 0.25222015380859375, 0.2608833312988281, 0.2695465087890625, 0.2782096862792969, 0.28687286376953125, 0.2955360412597656, 0.30419921875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 5.0, 11.0, 13.0, 48.0, 72.0, 134.0, 258.0, 220.0, 132.0, 49.0, 30.0, 11.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.910064697265625e-05, -3.7913210690021515e-05, -3.672577440738678e-05, -3.5538338124752045e-05, -3.435090184211731e-05, -3.3163465559482574e-05, -3.197602927684784e-05, -3.0788592994213104e-05, -2.960115671157837e-05, -2.8413720428943634e-05, -2.72262841463089e-05, -2.6038847863674164e-05, -2.485141158103943e-05, -2.3663975298404694e-05, -2.247653901576996e-05, -2.1289102733135223e-05, -2.0101666450500488e-05, -1.8914230167865753e-05, -1.7726793885231018e-05, -1.6539357602596283e-05, -1.5351921319961548e-05, -1.4164485037326813e-05, -1.2977048754692078e-05, -1.1789612472057343e-05, -1.0602176189422607e-05, -9.414739906787872e-06, -8.227303624153137e-06, -7.039867341518402e-06, -5.852431058883667e-06, -4.664994776248932e-06, -3.4775584936141968e-06, -2.2901222109794617e-06, -1.1026859283447266e-06, 8.475035429000854e-08, 1.2721866369247437e-06, 2.4596229195594788e-06, 3.647059202194214e-06, 4.834495484828949e-06, 6.021931767463684e-06, 7.209368050098419e-06, 8.396804332733154e-06, 9.58424061536789e-06, 1.0771676898002625e-05, 1.195911318063736e-05, 1.3146549463272095e-05, 1.433398574590683e-05, 1.5521422028541565e-05, 1.67088583111763e-05, 1.7896294593811035e-05, 1.908373087644577e-05, 2.0271167159080505e-05, 2.145860344171524e-05, 2.2646039724349976e-05, 2.383347600698471e-05, 2.5020912289619446e-05, 2.620834857225418e-05, 2.7395784854888916e-05, 2.858322113752365e-05, 2.9770657420158386e-05, 3.095809370279312e-05, 3.2145529985427856e-05, 3.333296626806259e-05, 3.452040255069733e-05, 3.570783883333206e-05, 3.68952751159668e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 5.0, 7.0, 7.0, 16.0, 28.0, 53.0, 130.0, 386.0, 1778.0, 26249.0, 999757.0, 18079.0, 1482.0, 367.0, 110.0, 48.0, 21.0, 9.0, 9.0, 7.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7021484375, -0.680511474609375, -0.65887451171875, -0.637237548828125, -0.6156005859375, -0.593963623046875, -0.57232666015625, -0.550689697265625, -0.529052734375, -0.507415771484375, -0.48577880859375, -0.464141845703125, -0.4425048828125, -0.420867919921875, -0.39923095703125, -0.377593994140625, -0.35595703125, -0.334320068359375, -0.31268310546875, -0.291046142578125, -0.2694091796875, -0.247772216796875, -0.22613525390625, -0.204498291015625, -0.182861328125, -0.161224365234375, -0.13958740234375, -0.117950439453125, -0.0963134765625, -0.074676513671875, -0.05303955078125, -0.031402587890625, -0.009765625, 0.011871337890625, 0.03350830078125, 0.055145263671875, 0.0767822265625, 0.098419189453125, 0.12005615234375, 0.141693115234375, 0.163330078125, 0.184967041015625, 0.20660400390625, 0.228240966796875, 0.2498779296875, 0.271514892578125, 0.29315185546875, 0.314788818359375, 0.33642578125, 0.358062744140625, 0.37969970703125, 0.401336669921875, 0.4229736328125, 0.444610595703125, 0.46624755859375, 0.487884521484375, 0.509521484375, 0.531158447265625, 0.55279541015625, 0.574432373046875, 0.5960693359375, 0.617706298828125, 0.63934326171875, 0.660980224609375, 0.6826171875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 8.0, 5.0, 3.0, 10.0, 9.0, 18.0, 50.0, 88.0, 167.0, 236.0, 163.0, 99.0, 54.0, 41.0, 18.0, 11.0, 8.0, 4.0, 7.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.368408203125, -0.3567466735839844, -0.34508514404296875, -0.3334236145019531, -0.3217620849609375, -0.3101005554199219, -0.29843902587890625, -0.2867774963378906, -0.275115966796875, -0.2634544372558594, -0.25179290771484375, -0.24013137817382812, -0.2284698486328125, -0.21680831909179688, -0.20514678955078125, -0.19348526000976562, -0.18182373046875, -0.17016220092773438, -0.15850067138671875, -0.14683914184570312, -0.1351776123046875, -0.12351608276367188, -0.11185455322265625, -0.10019302368164062, -0.088531494140625, -0.07686996459960938, -0.06520843505859375, -0.053546905517578125, -0.0418853759765625, -0.030223846435546875, -0.01856231689453125, -0.006900787353515625, 0.0047607421875, 0.016422271728515625, 0.02808380126953125, 0.039745330810546875, 0.0514068603515625, 0.06306838989257812, 0.07472991943359375, 0.08639144897460938, 0.098052978515625, 0.10971450805664062, 0.12137603759765625, 0.13303756713867188, 0.1446990966796875, 0.15636062622070312, 0.16802215576171875, 0.17968368530273438, 0.19134521484375, 0.20300674438476562, 0.21466827392578125, 0.22632980346679688, 0.2379913330078125, 0.24965286254882812, 0.26131439208984375, 0.2729759216308594, 0.284637451171875, 0.2962989807128906, 0.30796051025390625, 0.3196220397949219, 0.3312835693359375, 0.3429450988769531, 0.35460662841796875, 0.3662681579589844, 0.3779296875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 6.0, 20.0, 52.0, 160.0, 442.0, 200.0, 79.0, 23.0, 17.0, 1.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.938676834106445, -5.698006629943848, -5.45733642578125, -5.216666221618652, -4.975996017456055, -4.735325813293457, -4.494655609130859, -4.253985404968262, -4.013315200805664, -3.7726449966430664, -3.5319747924804688, -3.291304588317871, -3.0506343841552734, -2.809964179992676, -2.5692942142486572, -2.3286240100860596, -2.087954044342041, -1.8472838401794434, -1.6066136360168457, -1.3659435510635376, -1.12527334690094, -0.8846031427383423, -0.6439330577850342, -0.4032628536224365, -0.16259264945983887, 0.0780775249004364, 0.31874769926071167, 0.5594178438186646, 0.8000880479812622, 1.0407582521438599, 1.281428337097168, 1.5220985412597656, 1.7627687454223633, 2.003438949584961, 2.2441091537475586, 2.4847793579101562, 2.725449562072754, 2.9661197662353516, 3.20678973197937, 3.4474599361419678, 3.6881301403045654, 3.928800344467163, 4.169470310211182, 4.410140514373779, 4.650810718536377, 4.891480922698975, 5.132151126861572, 5.37282133102417, 5.613491535186768, 5.854161739349365, 6.094831943511963, 6.3355021476745605, 6.576172351837158, 6.816842555999756, 7.057512283325195, 7.298182487487793, 7.538852691650391, 7.779522895812988, 8.020193099975586, 8.260863304138184, 8.501533508300781, 8.742203712463379, 8.982873916625977, 9.223544120788574, 9.464214324951172]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 7.0, 9.0, 14.0, 15.0, 15.0, 21.0, 22.0, 31.0, 37.0, 34.0, 57.0, 60.0, 62.0, 65.0, 84.0, 69.0, 51.0, 66.0, 61.0, 47.0, 44.0, 25.0, 33.0, 20.0, 15.0, 15.0, 8.0, 6.0, 2.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.111644744873047, -3.957146167755127, -3.802647590637207, -3.648149013519287, -3.493650197982788, -3.339151620864868, -3.1846530437469482, -3.030154228210449, -2.8756556510925293, -2.7211570739746094, -2.5666584968566895, -2.4121599197387695, -2.2576611042022705, -2.1031625270843506, -1.9486639499664307, -1.7941652536392212, -1.6396667957305908, -1.485168218612671, -1.3306695222854614, -1.1761709451675415, -1.021672248840332, -0.8671736717224121, -0.7126750946044922, -0.5581763982772827, -0.4036778211593628, -0.2491791993379593, -0.09468057751655579, 0.05981802940368652, 0.21431666612625122, 0.3688153028488159, 0.5233138799667358, 0.6778125762939453, 0.8323111534118652, 0.9868097901344299, 1.1413084268569946, 1.2958070039749146, 1.450305700302124, 1.604804277420044, 1.7593028545379639, 1.9138015508651733, 2.068300247192383, 2.2227988243103027, 2.3772974014282227, 2.5317959785461426, 2.6862947940826416, 2.8407933712005615, 2.9952919483184814, 3.1497907638549805, 3.3042891025543213, 3.458787679672241, 3.613286256790161, 3.76778507232666, 3.92228364944458, 4.0767822265625, 4.23128080368042, 4.38577938079834, 4.54027795791626, 4.69477653503418, 4.8492751121521, 5.0037736892700195, 5.1582722663879395, 5.312770843505859, 5.4672698974609375, 5.621768474578857, 5.776267051696777]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 5.0, 7.0, 10.0, 22.0, 42.0, 150.0, 643.0, 302639.0, 3889996.0, 546.0, 130.0, 45.0, 15.0, 9.0, 8.0, 4.0, 4.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.17578125, -6.032196044921875, -5.88861083984375, -5.745025634765625, -5.6014404296875, -5.457855224609375, -5.31427001953125, -5.170684814453125, -5.027099609375, -4.883514404296875, -4.73992919921875, -4.596343994140625, -4.4527587890625, -4.309173583984375, -4.16558837890625, -4.022003173828125, -3.87841796875, -3.734832763671875, -3.59124755859375, -3.447662353515625, -3.3040771484375, -3.160491943359375, -3.01690673828125, -2.873321533203125, -2.729736328125, -2.586151123046875, -2.44256591796875, -2.298980712890625, -2.1553955078125, -2.011810302734375, -1.86822509765625, -1.724639892578125, -1.5810546875, -1.437469482421875, -1.29388427734375, -1.150299072265625, -1.0067138671875, -0.863128662109375, -0.71954345703125, -0.575958251953125, -0.432373046875, -0.288787841796875, -0.14520263671875, -0.001617431640625, 0.1419677734375, 0.285552978515625, 0.42913818359375, 0.572723388671875, 0.71630859375, 0.859893798828125, 1.00347900390625, 1.147064208984375, 1.2906494140625, 1.434234619140625, 1.57781982421875, 1.721405029296875, 1.864990234375, 2.008575439453125, 2.15216064453125, 2.295745849609375, 2.4393310546875, 2.582916259765625, 2.72650146484375, 2.870086669921875, 3.013671875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 6.0, 15.0, 36.0, 115.0, 197.0, 290.0, 207.0, 79.0, 33.0, 12.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.71630859375, -0.6998023986816406, -0.6832962036132812, -0.6667900085449219, -0.6502838134765625, -0.6337776184082031, -0.6172714233398438, -0.6007652282714844, -0.584259033203125, -0.5677528381347656, -0.5512466430664062, -0.5347404479980469, -0.5182342529296875, -0.5017280578613281, -0.48522186279296875, -0.4687156677246094, -0.45220947265625, -0.4357032775878906, -0.41919708251953125, -0.4026908874511719, -0.3861846923828125, -0.3696784973144531, -0.35317230224609375, -0.3366661071777344, -0.320159912109375, -0.3036537170410156, -0.28714752197265625, -0.2706413269042969, -0.2541351318359375, -0.23762893676757812, -0.22112274169921875, -0.20461654663085938, -0.1881103515625, -0.17160415649414062, -0.15509796142578125, -0.13859176635742188, -0.1220855712890625, -0.10557937622070312, -0.08907318115234375, -0.07256698608398438, -0.056060791015625, -0.039554595947265625, -0.02304840087890625, -0.006542205810546875, 0.0099639892578125, 0.026470184326171875, 0.04297637939453125, 0.059482574462890625, 0.07598876953125, 0.09249496459960938, 0.10900115966796875, 0.12550735473632812, 0.1420135498046875, 0.15851974487304688, 0.17502593994140625, 0.19153213500976562, 0.208038330078125, 0.22454452514648438, 0.24105072021484375, 0.2575569152832031, 0.2740631103515625, 0.2905693054199219, 0.30707550048828125, 0.3235816955566406, 0.340087890625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 7.0, 5.0, 9.0, 17.0, 37.0, 48.0, 114.0, 188.0, 458.0, 1188.0, 4644.0, 32358.0, 4081709.0, 64205.0, 6761.0, 1619.0, 504.0, 202.0, 112.0, 45.0, 21.0, 9.0, 11.0, 6.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58740234375, -0.5614242553710938, -0.5354461669921875, -0.5094680786132812, -0.483489990234375, -0.45751190185546875, -0.4315338134765625, -0.40555572509765625, -0.37957763671875, -0.35359954833984375, -0.3276214599609375, -0.30164337158203125, -0.275665283203125, -0.24968719482421875, -0.2237091064453125, -0.19773101806640625, -0.1717529296875, -0.14577484130859375, -0.1197967529296875, -0.09381866455078125, -0.067840576171875, -0.04186248779296875, -0.0158843994140625, 0.01009368896484375, 0.03607177734375, 0.06204986572265625, 0.0880279541015625, 0.11400604248046875, 0.139984130859375, 0.16596221923828125, 0.1919403076171875, 0.21791839599609375, 0.243896484375, 0.26987457275390625, 0.2958526611328125, 0.32183074951171875, 0.347808837890625, 0.37378692626953125, 0.3997650146484375, 0.42574310302734375, 0.45172119140625, 0.47769927978515625, 0.5036773681640625, 0.5296554565429688, 0.555633544921875, 0.5816116333007812, 0.6075897216796875, 0.6335678100585938, 0.6595458984375, 0.6855239868164062, 0.7115020751953125, 0.7374801635742188, 0.763458251953125, 0.7894363403320312, 0.8154144287109375, 0.8413925170898438, 0.86737060546875, 0.8933486938476562, 0.9193267822265625, 0.9453048706054688, 0.971282958984375, 0.9972610473632812, 1.0232391357421875, 1.0492172241210938, 1.0751953125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 6.0, 8.0, 14.0, 22.0, 48.0, 122.0, 497.0, 3038.0, 175.0, 44.0, 23.0, 23.0, 19.0, 8.0, 3.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.318115234375, -0.3095703125, -0.301025390625, -0.29248046875, -0.283935546875, -0.275390625, -0.266845703125, -0.25830078125, -0.249755859375, -0.2412109375, -0.232666015625, -0.22412109375, -0.215576171875, -0.20703125, -0.198486328125, -0.18994140625, -0.181396484375, -0.1728515625, -0.164306640625, -0.15576171875, -0.147216796875, -0.138671875, -0.130126953125, -0.12158203125, -0.113037109375, -0.1044921875, -0.095947265625, -0.08740234375, -0.078857421875, -0.0703125, -0.061767578125, -0.05322265625, -0.044677734375, -0.0361328125, -0.027587890625, -0.01904296875, -0.010498046875, -0.001953125, 0.006591796875, 0.01513671875, 0.023681640625, 0.0322265625, 0.040771484375, 0.04931640625, 0.057861328125, 0.06640625, 0.074951171875, 0.08349609375, 0.092041015625, 0.1005859375, 0.109130859375, 0.11767578125, 0.126220703125, 0.134765625, 0.143310546875, 0.15185546875, 0.160400390625, 0.1689453125, 0.177490234375, 0.18603515625, 0.194580078125, 0.203125, 0.211669921875, 0.22021484375, 0.228759765625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 7.0, 33.0, 147.0, 533.0, 241.0, 41.0, 6.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.640495777130127, -3.567335605621338, -3.494175434112549, -3.4210152626037598, -3.3478550910949707, -3.2746951580047607, -3.2015349864959717, -3.1283748149871826, -3.0552146434783936, -2.9820544719696045, -2.9088943004608154, -2.8357341289520264, -2.7625741958618164, -2.6894140243530273, -2.6162538528442383, -2.543093681335449, -2.46993350982666, -2.396773338317871, -2.323613166809082, -2.250452995300293, -2.177292823791504, -2.104132890701294, -2.030972719192505, -1.9578125476837158, -1.8846523761749268, -1.8114922046661377, -1.7383320331573486, -1.6651719808578491, -1.59201180934906, -1.518851637840271, -1.4456915855407715, -1.3725314140319824, -1.2993710041046143, -1.2262108325958252, -1.1530506610870361, -1.0798906087875366, -1.0067304372787476, -0.9335702657699585, -0.8604101538658142, -0.7872500419616699, -0.7140898704528809, -0.6409296989440918, -0.5677695870399475, -0.49460944533348083, -0.42144930362701416, -0.3482891619205475, -0.2751290202140808, -0.20196890830993652, -0.12880873680114746, -0.055648595094680786, 0.01751154661178589, 0.09067168831825256, 0.16383183002471924, 0.2369919717311859, 0.3101521134376526, 0.3833122253417969, 0.45647239685058594, 0.529632568359375, 0.6027926802635193, 0.6759527921676636, 0.7491129636764526, 0.8222731351852417, 0.895433247089386, 0.9685933589935303, 1.0417535305023193]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 2.0, 5.0, 7.0, 11.0, 18.0, 15.0, 29.0, 32.0, 26.0, 44.0, 64.0, 55.0, 60.0, 50.0, 48.0, 51.0, 69.0, 51.0, 56.0, 64.0, 48.0, 40.0, 40.0, 30.0, 32.0, 18.0, 10.0, 12.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8985940217971802, -0.8755716681480408, -0.8525493144989014, -0.8295270204544067, -0.8065046668052673, -0.7834823131561279, -0.7604599595069885, -0.7374376058578491, -0.7144153118133545, -0.6913929581642151, -0.6683706045150757, -0.645348310470581, -0.6223259568214417, -0.5993036031723022, -0.5762812495231628, -0.5532588958740234, -0.530236542224884, -0.5072141885757446, -0.4841918647289276, -0.4611695110797882, -0.4381471872329712, -0.4151248335838318, -0.3921024799346924, -0.369080126285553, -0.34605780243873596, -0.32303544878959656, -0.30001312494277954, -0.27699077129364014, -0.25396841764450073, -0.23094609379768372, -0.2079237401485443, -0.1849014014005661, -0.16187900304794312, -0.1388566642999649, -0.1158343181014061, -0.09281197190284729, -0.06978963315486908, -0.04676729440689087, -0.023744940757751465, -0.0007226020097732544, 0.022299736738204956, 0.045322079211473465, 0.06834442168474197, 0.09136676788330078, 0.11438910663127899, 0.1374114453792572, 0.1604337990283966, 0.18345613777637482, 0.20647847652435303, 0.22950081527233124, 0.25252315402030945, 0.27554550766944885, 0.29856783151626587, 0.3215901851654053, 0.3446125388145447, 0.3676348924636841, 0.3906572163105011, 0.4136795699596405, 0.4367018938064575, 0.4597242474555969, 0.48274660110473633, 0.505768895149231, 0.5287913084030151, 0.5518136024475098, 0.5748359560966492]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 6.0, 4.0, 7.0, 17.0, 12.0, 19.0, 30.0, 46.0, 64.0, 72.0, 123.0, 246.0, 477.0, 1053.0, 2690.0, 14797.0, 835382.0, 182714.0, 7199.0, 1906.0, 772.0, 389.0, 192.0, 109.0, 55.0, 33.0, 46.0, 23.0, 21.0, 13.0, 14.0, 6.0, 7.0, 8.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.189453125, -2.122772216796875, -2.05609130859375, -1.989410400390625, -1.9227294921875, -1.856048583984375, -1.78936767578125, -1.722686767578125, -1.656005859375, -1.589324951171875, -1.52264404296875, -1.455963134765625, -1.3892822265625, -1.322601318359375, -1.25592041015625, -1.189239501953125, -1.12255859375, -1.055877685546875, -0.98919677734375, -0.922515869140625, -0.8558349609375, -0.789154052734375, -0.72247314453125, -0.655792236328125, -0.589111328125, -0.522430419921875, -0.45574951171875, -0.389068603515625, -0.3223876953125, -0.255706787109375, -0.18902587890625, -0.122344970703125, -0.0556640625, 0.011016845703125, 0.07769775390625, 0.144378662109375, 0.2110595703125, 0.277740478515625, 0.34442138671875, 0.411102294921875, 0.477783203125, 0.544464111328125, 0.61114501953125, 0.677825927734375, 0.7445068359375, 0.811187744140625, 0.87786865234375, 0.944549560546875, 1.01123046875, 1.077911376953125, 1.14459228515625, 1.211273193359375, 1.2779541015625, 1.344635009765625, 1.41131591796875, 1.477996826171875, 1.544677734375, 1.611358642578125, 1.67803955078125, 1.744720458984375, 1.8114013671875, 1.878082275390625, 1.94476318359375, 2.011444091796875, 2.078125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 9.0, 16.0, 44.0, 125.0, 229.0, 258.0, 196.0, 71.0, 35.0, 8.0, 3.0, 5.0, 2.0, 0.0, 4.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7109375, -0.6945114135742188, -0.6780853271484375, -0.6616592407226562, -0.645233154296875, -0.6288070678710938, -0.6123809814453125, -0.5959548950195312, -0.57952880859375, -0.5631027221679688, -0.5466766357421875, -0.5302505493164062, -0.513824462890625, -0.49739837646484375, -0.4809722900390625, -0.46454620361328125, -0.4481201171875, -0.43169403076171875, -0.4152679443359375, -0.39884185791015625, -0.382415771484375, -0.36598968505859375, -0.3495635986328125, -0.33313751220703125, -0.31671142578125, -0.30028533935546875, -0.2838592529296875, -0.26743316650390625, -0.251007080078125, -0.23458099365234375, -0.2181549072265625, -0.20172882080078125, -0.185302734375, -0.16887664794921875, -0.1524505615234375, -0.13602447509765625, -0.119598388671875, -0.10317230224609375, -0.0867462158203125, -0.07032012939453125, -0.05389404296875, -0.03746795654296875, -0.0210418701171875, -0.00461578369140625, 0.011810302734375, 0.02823638916015625, 0.0446624755859375, 0.06108856201171875, 0.0775146484375, 0.09394073486328125, 0.1103668212890625, 0.12679290771484375, 0.143218994140625, 0.15964508056640625, 0.1760711669921875, 0.19249725341796875, 0.20892333984375, 0.22534942626953125, 0.2417755126953125, 0.25820159912109375, 0.274627685546875, 0.29105377197265625, 0.3074798583984375, 0.32390594482421875, 0.34033203125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 5.0, 3.0, 8.0, 12.0, 12.0, 15.0, 22.0, 25.0, 27.0, 25.0, 50.0, 52.0, 115.0, 255.0, 737.0, 2519.0, 13124.0, 110679.0, 804216.0, 100729.0, 12228.0, 2378.0, 682.0, 252.0, 121.0, 56.0, 48.0, 29.0, 23.0, 23.0, 17.0, 12.0, 15.0, 9.0, 9.0, 4.0, 3.0, 5.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2626953125, -1.22607421875, -1.189453125, -1.15283203125, -1.1162109375, -1.07958984375, -1.04296875, -1.00634765625, -0.9697265625, -0.93310546875, -0.896484375, -0.85986328125, -0.8232421875, -0.78662109375, -0.75, -0.71337890625, -0.6767578125, -0.64013671875, -0.603515625, -0.56689453125, -0.5302734375, -0.49365234375, -0.45703125, -0.42041015625, -0.3837890625, -0.34716796875, -0.310546875, -0.27392578125, -0.2373046875, -0.20068359375, -0.1640625, -0.12744140625, -0.0908203125, -0.05419921875, -0.017578125, 0.01904296875, 0.0556640625, 0.09228515625, 0.12890625, 0.16552734375, 0.2021484375, 0.23876953125, 0.275390625, 0.31201171875, 0.3486328125, 0.38525390625, 0.421875, 0.45849609375, 0.4951171875, 0.53173828125, 0.568359375, 0.60498046875, 0.6416015625, 0.67822265625, 0.71484375, 0.75146484375, 0.7880859375, 0.82470703125, 0.861328125, 0.89794921875, 0.9345703125, 0.97119140625, 1.0078125, 1.04443359375, 1.0810546875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 3.0, 1.0, 3.0, 5.0, 7.0, 5.0, 10.0, 16.0, 11.0, 19.0, 21.0, 22.0, 27.0, 35.0, 34.0, 37.0, 36.0, 41.0, 44.0, 54.0, 44.0, 56.0, 56.0, 48.0, 52.0, 31.0, 44.0, 33.0, 32.0, 31.0, 17.0, 35.0, 17.0, 17.0, 16.0, 13.0, 8.0, 9.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6220703125, -0.6008453369140625, -0.579620361328125, -0.5583953857421875, -0.53717041015625, -0.5159454345703125, -0.494720458984375, -0.4734954833984375, -0.4522705078125, -0.4310455322265625, -0.409820556640625, -0.3885955810546875, -0.36737060546875, -0.3461456298828125, -0.324920654296875, -0.3036956787109375, -0.282470703125, -0.2612457275390625, -0.240020751953125, -0.2187957763671875, -0.19757080078125, -0.1763458251953125, -0.155120849609375, -0.1338958740234375, -0.1126708984375, -0.0914459228515625, -0.070220947265625, -0.0489959716796875, -0.02777099609375, -0.0065460205078125, 0.014678955078125, 0.0359039306640625, 0.05712890625, 0.0783538818359375, 0.099578857421875, 0.1208038330078125, 0.14202880859375, 0.1632537841796875, 0.184478759765625, 0.2057037353515625, 0.2269287109375, 0.2481536865234375, 0.269378662109375, 0.2906036376953125, 0.31182861328125, 0.3330535888671875, 0.354278564453125, 0.3755035400390625, 0.396728515625, 0.4179534912109375, 0.439178466796875, 0.4604034423828125, 0.48162841796875, 0.5028533935546875, 0.524078369140625, 0.5453033447265625, 0.5665283203125, 0.5877532958984375, 0.608978271484375, 0.6302032470703125, 0.65142822265625, 0.6726531982421875, 0.693878173828125, 0.7151031494140625, 0.736328125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 12.0, 8.0, 18.0, 22.0, 37.0, 52.0, 78.0, 158.0, 244.0, 533.0, 1176.0, 3359.0, 13484.0, 92631.0, 770763.0, 141505.0, 17625.0, 4168.0, 1396.0, 577.0, 291.0, 139.0, 102.0, 64.0, 32.0, 31.0, 13.0, 7.0, 8.0, 8.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2410888671875, -0.23320579528808594, -0.22532272338867188, -0.2174396514892578, -0.20955657958984375, -0.2016735076904297, -0.19379043579101562, -0.18590736389160156, -0.1780242919921875, -0.17014122009277344, -0.16225814819335938, -0.1543750762939453, -0.14649200439453125, -0.1386089324951172, -0.13072586059570312, -0.12284278869628906, -0.114959716796875, -0.10707664489746094, -0.09919357299804688, -0.09131050109863281, -0.08342742919921875, -0.07554435729980469, -0.06766128540039062, -0.05977821350097656, -0.0518951416015625, -0.04401206970214844, -0.036128997802734375, -0.028245925903320312, -0.02036285400390625, -0.012479782104492188, -0.004596710205078125, 0.0032863616943359375, 0.01116943359375, 0.019052505493164062, 0.026935577392578125, 0.03481864929199219, 0.04270172119140625, 0.05058479309082031, 0.058467864990234375, 0.06635093688964844, 0.0742340087890625, 0.08211708068847656, 0.09000015258789062, 0.09788322448730469, 0.10576629638671875, 0.11364936828613281, 0.12153244018554688, 0.12941551208496094, 0.137298583984375, 0.14518165588378906, 0.15306472778320312, 0.1609477996826172, 0.16883087158203125, 0.1767139434814453, 0.18459701538085938, 0.19248008728027344, 0.2003631591796875, 0.20824623107910156, 0.21612930297851562, 0.2240123748779297, 0.23189544677734375, 0.2397785186767578, 0.24766159057617188, 0.25554466247558594, 0.263427734375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 10.0, 12.0, 7.0, 15.0, 33.0, 35.0, 53.0, 88.0, 112.0, 161.0, 118.0, 124.0, 89.0, 57.0, 30.0, 22.0, 11.0, 9.0, 11.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0], "bins": [-4.297494888305664e-05, -4.209205508232117e-05, -4.120916128158569e-05, -4.032626748085022e-05, -3.9443373680114746e-05, -3.856047987937927e-05, -3.76775860786438e-05, -3.6794692277908325e-05, -3.591179847717285e-05, -3.502890467643738e-05, -3.4146010875701904e-05, -3.326311707496643e-05, -3.238022327423096e-05, -3.1497329473495483e-05, -3.061443567276001e-05, -2.9731541872024536e-05, -2.8848648071289062e-05, -2.796575427055359e-05, -2.7082860469818115e-05, -2.619996666908264e-05, -2.5317072868347168e-05, -2.4434179067611694e-05, -2.355128526687622e-05, -2.2668391466140747e-05, -2.1785497665405273e-05, -2.09026038646698e-05, -2.0019710063934326e-05, -1.9136816263198853e-05, -1.825392246246338e-05, -1.7371028661727905e-05, -1.648813486099243e-05, -1.5605241060256958e-05, -1.4722347259521484e-05, -1.383945345878601e-05, -1.2956559658050537e-05, -1.2073665857315063e-05, -1.119077205657959e-05, -1.0307878255844116e-05, -9.424984455108643e-06, -8.542090654373169e-06, -7.659196853637695e-06, -6.776303052902222e-06, -5.893409252166748e-06, -5.010515451431274e-06, -4.127621650695801e-06, -3.244727849960327e-06, -2.3618340492248535e-06, -1.4789402484893799e-06, -5.960464477539062e-07, 2.868473529815674e-07, 1.169741153717041e-06, 2.0526349544525146e-06, 2.9355287551879883e-06, 3.818422555923462e-06, 4.7013163566589355e-06, 5.584210157394409e-06, 6.467103958129883e-06, 7.3499977588653564e-06, 8.23289155960083e-06, 9.115785360336304e-06, 9.998679161071777e-06, 1.0881572961807251e-05, 1.1764466762542725e-05, 1.2647360563278198e-05, 1.3530254364013672e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 2.0, 5.0, 11.0, 2.0, 11.0, 6.0, 12.0, 15.0, 12.0, 23.0, 42.0, 71.0, 111.0, 282.0, 625.0, 2113.0, 10111.0, 83117.0, 840726.0, 96757.0, 10901.0, 2323.0, 673.0, 251.0, 123.0, 69.0, 36.0, 20.0, 23.0, 19.0, 12.0, 12.0, 8.0, 4.0, 5.0, 3.0, 4.0, 3.0, 1.0, 2.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26513671875, -0.25615692138671875, -0.2471771240234375, -0.23819732666015625, -0.229217529296875, -0.22023773193359375, -0.2112579345703125, -0.20227813720703125, -0.19329833984375, -0.18431854248046875, -0.1753387451171875, -0.16635894775390625, -0.157379150390625, -0.14839935302734375, -0.1394195556640625, -0.13043975830078125, -0.1214599609375, -0.11248016357421875, -0.1035003662109375, -0.09452056884765625, -0.085540771484375, -0.07656097412109375, -0.0675811767578125, -0.05860137939453125, -0.04962158203125, -0.04064178466796875, -0.0316619873046875, -0.02268218994140625, -0.013702392578125, -0.00472259521484375, 0.0042572021484375, 0.01323699951171875, 0.022216796875, 0.03119659423828125, 0.0401763916015625, 0.04915618896484375, 0.058135986328125, 0.06711578369140625, 0.0760955810546875, 0.08507537841796875, 0.09405517578125, 0.10303497314453125, 0.1120147705078125, 0.12099456787109375, 0.129974365234375, 0.13895416259765625, 0.1479339599609375, 0.15691375732421875, 0.1658935546875, 0.17487335205078125, 0.1838531494140625, 0.19283294677734375, 0.201812744140625, 0.21079254150390625, 0.2197723388671875, 0.22875213623046875, 0.23773193359375, 0.24671173095703125, 0.2556915283203125, 0.26467132568359375, 0.273651123046875, 0.28263092041015625, 0.2916107177734375, 0.30059051513671875, 0.3095703125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 5.0, 6.0, 6.0, 5.0, 5.0, 8.0, 13.0, 15.0, 12.0, 15.0, 26.0, 23.0, 39.0, 32.0, 65.0, 81.0, 76.0, 81.0, 72.0, 68.0, 55.0, 54.0, 47.0, 42.0, 30.0, 25.0, 15.0, 11.0, 12.0, 8.0, 11.0, 9.0, 4.0, 4.0, 6.0, 5.0, 2.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1651611328125, -0.16042709350585938, -0.15569305419921875, -0.15095901489257812, -0.1462249755859375, -0.14149093627929688, -0.13675689697265625, -0.13202285766601562, -0.127288818359375, -0.12255477905273438, -0.11782073974609375, -0.11308670043945312, -0.1083526611328125, -0.10361862182617188, -0.09888458251953125, -0.09415054321289062, -0.08941650390625, -0.08468246459960938, -0.07994842529296875, -0.07521438598632812, -0.0704803466796875, -0.06574630737304688, -0.06101226806640625, -0.056278228759765625, -0.051544189453125, -0.046810150146484375, -0.04207611083984375, -0.037342071533203125, -0.0326080322265625, -0.027873992919921875, -0.02313995361328125, -0.018405914306640625, -0.013671875, -0.008937835693359375, -0.00420379638671875, 0.000530242919921875, 0.0052642822265625, 0.009998321533203125, 0.01473236083984375, 0.019466400146484375, 0.024200439453125, 0.028934478759765625, 0.03366851806640625, 0.038402557373046875, 0.0431365966796875, 0.047870635986328125, 0.05260467529296875, 0.057338714599609375, 0.06207275390625, 0.06680679321289062, 0.07154083251953125, 0.07627487182617188, 0.0810089111328125, 0.08574295043945312, 0.09047698974609375, 0.09521102905273438, 0.099945068359375, 0.10467910766601562, 0.10941314697265625, 0.11414718627929688, 0.1188812255859375, 0.12361526489257812, 0.12834930419921875, 0.13308334350585938, 0.1378173828125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 6.0, 18.0, 50.0, 187.0, 503.0, 171.0, 49.0, 16.0, 5.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.74199104309082, -16.41053009033203, -16.079071044921875, -15.747610092163086, -15.416150093078613, -15.08469009399414, -14.753229141235352, -14.421769142150879, -14.090309143066406, -13.758849143981934, -13.427389144897461, -13.095928192138672, -12.7644681930542, -12.433008193969727, -12.101547241210938, -11.770087242126465, -11.438627243041992, -11.10716724395752, -10.775707244873047, -10.444246292114258, -10.112786293029785, -9.781326293945312, -9.449865341186523, -9.11840534210205, -8.786945343017578, -8.455485343933105, -8.124025344848633, -7.792564392089844, -7.461104393005371, -7.129644393920898, -6.798183917999268, -6.466723442077637, -6.135263442993164, -5.803803443908691, -5.4723429679870605, -5.14088249206543, -4.809422492980957, -4.477962493896484, -4.1465020179748535, -3.8150417804718018, -3.48358154296875, -3.1521213054656982, -2.8206610679626465, -2.4892008304595947, -2.157740592956543, -1.8262803554534912, -1.4948201179504395, -1.1633598804473877, -0.8318996429443359, -0.5004394054412842, -0.16897916793823242, 0.16248106956481934, 0.4939413070678711, 0.8254015445709229, 1.1568617820739746, 1.4883220195770264, 1.8197822570800781, 2.15124249458313, 2.4827027320861816, 2.8141629695892334, 3.145623207092285, 3.477083444595337, 3.8085436820983887, 4.1400041580200195, 4.471464157104492]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 6.0, 10.0, 4.0, 5.0, 8.0, 8.0, 12.0, 15.0, 15.0, 22.0, 24.0, 32.0, 39.0, 37.0, 34.0, 28.0, 46.0, 45.0, 35.0, 44.0, 51.0, 52.0, 42.0, 44.0, 46.0, 35.0, 31.0, 36.0, 35.0, 34.0, 23.0, 23.0, 19.0, 15.0, 10.0, 9.0, 4.0, 5.0, 7.0, 2.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.852600574493408, -3.736675262451172, -3.6207501888275146, -3.5048248767852783, -3.388899803161621, -3.2729744911193848, -3.1570494174957275, -3.041124105453491, -2.925199031829834, -2.8092737197875977, -2.6933486461639404, -2.577423334121704, -2.461498260498047, -2.3455729484558105, -2.2296478748321533, -2.113722562789917, -1.9977973699569702, -1.8818721771240234, -1.7659469842910767, -1.6500217914581299, -1.534096598625183, -1.4181714057922363, -1.30224609375, -1.1863210201263428, -1.0703957080841064, -0.9544705152511597, -0.8385453224182129, -0.7226201295852661, -0.6066949367523193, -0.4907696843147278, -0.374844491481781, -0.25891929864883423, -0.14299416542053223, -0.027068965137004852, 0.08885623514652252, 0.2047814428806305, 0.32070663571357727, 0.43663185834884644, 0.5525570511817932, 0.66848224401474, 0.7844074368476868, 0.9003326296806335, 1.016257882118225, 1.1321830749511719, 1.2481082677841187, 1.3640334606170654, 1.4799586534500122, 1.595883846282959, 1.7118090391159058, 1.8277342319488525, 1.9436594247817993, 2.059584617614746, 2.1755099296569824, 2.2914350032806396, 2.407360315322876, 2.523285388946533, 2.6392107009887695, 2.755136013031006, 2.871061086654663, 2.9869863986968994, 3.1029114723205566, 3.218836784362793, 3.33476185798645, 3.4506871700286865, 3.5666122436523438]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 2.0, 4.0, 15.0, 12.0, 13.0, 25.0, 43.0, 79.0, 242.0, 928.0, 7104.0, 4179547.0, 5250.0, 702.0, 165.0, 54.0, 35.0, 23.0, 15.0, 7.0, 4.0, 7.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.71484375, -5.5863037109375, -5.457763671875, -5.3292236328125, -5.20068359375, -5.0721435546875, -4.943603515625, -4.8150634765625, -4.6865234375, -4.5579833984375, -4.429443359375, -4.3009033203125, -4.17236328125, -4.0438232421875, -3.915283203125, -3.7867431640625, -3.658203125, -3.5296630859375, -3.401123046875, -3.2725830078125, -3.14404296875, -3.0155029296875, -2.886962890625, -2.7584228515625, -2.6298828125, -2.5013427734375, -2.372802734375, -2.2442626953125, -2.11572265625, -1.9871826171875, -1.858642578125, -1.7301025390625, -1.6015625, -1.4730224609375, -1.344482421875, -1.2159423828125, -1.08740234375, -0.9588623046875, -0.830322265625, -0.7017822265625, -0.5732421875, -0.4447021484375, -0.316162109375, -0.1876220703125, -0.05908203125, 0.0694580078125, 0.197998046875, 0.3265380859375, 0.455078125, 0.5836181640625, 0.712158203125, 0.8406982421875, 0.96923828125, 1.0977783203125, 1.226318359375, 1.3548583984375, 1.4833984375, 1.6119384765625, 1.740478515625, 1.8690185546875, 1.99755859375, 2.1260986328125, 2.254638671875, 2.3831787109375, 2.51171875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 21.0, 72.0, 107.0, 191.0, 241.0, 168.0, 114.0, 39.0, 20.0, 9.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.74072265625, -0.7240219116210938, -0.7073211669921875, -0.6906204223632812, -0.673919677734375, -0.6572189331054688, -0.6405181884765625, -0.6238174438476562, -0.60711669921875, -0.5904159545898438, -0.5737152099609375, -0.5570144653320312, -0.540313720703125, -0.5236129760742188, -0.5069122314453125, -0.49021148681640625, -0.4735107421875, -0.45680999755859375, -0.4401092529296875, -0.42340850830078125, -0.406707763671875, -0.39000701904296875, -0.3733062744140625, -0.35660552978515625, -0.33990478515625, -0.32320404052734375, -0.3065032958984375, -0.28980255126953125, -0.273101806640625, -0.25640106201171875, -0.2397003173828125, -0.22299957275390625, -0.206298828125, -0.18959808349609375, -0.1728973388671875, -0.15619659423828125, -0.139495849609375, -0.12279510498046875, -0.1060943603515625, -0.08939361572265625, -0.07269287109375, -0.05599212646484375, -0.0392913818359375, -0.02259063720703125, -0.005889892578125, 0.01081085205078125, 0.0275115966796875, 0.04421234130859375, 0.0609130859375, 0.07761383056640625, 0.0943145751953125, 0.11101531982421875, 0.127716064453125, 0.14441680908203125, 0.1611175537109375, 0.17781829833984375, 0.19451904296875, 0.21121978759765625, 0.2279205322265625, 0.24462127685546875, 0.261322021484375, 0.27802276611328125, 0.2947235107421875, 0.31142425537109375, 0.328125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 8.0, 14.0, 14.0, 25.0, 56.0, 113.0, 243.0, 527.0, 1504.0, 5411.0, 39492.0, 4048861.0, 86290.0, 8116.0, 2161.0, 785.0, 316.0, 160.0, 77.0, 36.0, 36.0, 16.0, 7.0, 7.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.548828125, -1.5107040405273438, -1.4725799560546875, -1.4344558715820312, -1.396331787109375, -1.3582077026367188, -1.3200836181640625, -1.2819595336914062, -1.24383544921875, -1.2057113647460938, -1.1675872802734375, -1.1294631958007812, -1.091339111328125, -1.0532150268554688, -1.0150909423828125, -0.9769668579101562, -0.9388427734375, -0.9007186889648438, -0.8625946044921875, -0.8244705200195312, -0.786346435546875, -0.7482223510742188, -0.7100982666015625, -0.6719741821289062, -0.63385009765625, -0.5957260131835938, -0.5576019287109375, -0.5194778442382812, -0.481353759765625, -0.44322967529296875, -0.4051055908203125, -0.36698150634765625, -0.328857421875, -0.29073333740234375, -0.2526092529296875, -0.21448516845703125, -0.176361083984375, -0.13823699951171875, -0.1001129150390625, -0.06198883056640625, -0.02386474609375, 0.01425933837890625, 0.0523834228515625, 0.09050750732421875, 0.128631591796875, 0.16675567626953125, 0.2048797607421875, 0.24300384521484375, 0.2811279296875, 0.31925201416015625, 0.3573760986328125, 0.39550018310546875, 0.433624267578125, 0.47174835205078125, 0.5098724365234375, 0.5479965209960938, 0.58612060546875, 0.6242446899414062, 0.6623687744140625, 0.7004928588867188, 0.738616943359375, 0.7767410278320312, 0.8148651123046875, 0.8529891967773438, 0.89111328125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 5.0, 6.0, 4.0, 15.0, 27.0, 39.0, 72.0, 169.0, 767.0, 2625.0, 158.0, 58.0, 44.0, 28.0, 12.0, 10.0, 7.0, 7.0, 2.0, 3.0, 4.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.305419921875, -0.2922325134277344, -0.27904510498046875, -0.2658576965332031, -0.2526702880859375, -0.23948287963867188, -0.22629547119140625, -0.21310806274414062, -0.199920654296875, -0.18673324584960938, -0.17354583740234375, -0.16035842895507812, -0.1471710205078125, -0.13398361206054688, -0.12079620361328125, -0.10760879516601562, -0.09442138671875, -0.08123397827148438, -0.06804656982421875, -0.054859161376953125, -0.0416717529296875, -0.028484344482421875, -0.01529693603515625, -0.002109527587890625, 0.011077880859375, 0.024265289306640625, 0.03745269775390625, 0.050640106201171875, 0.0638275146484375, 0.07701492309570312, 0.09020233154296875, 0.10338973999023438, 0.1165771484375, 0.12976455688476562, 0.14295196533203125, 0.15613937377929688, 0.1693267822265625, 0.18251419067382812, 0.19570159912109375, 0.20888900756835938, 0.222076416015625, 0.23526382446289062, 0.24845123291015625, 0.2616386413574219, 0.2748260498046875, 0.2880134582519531, 0.30120086669921875, 0.3143882751464844, 0.32757568359375, 0.3407630920410156, 0.35395050048828125, 0.3671379089355469, 0.3803253173828125, 0.3935127258300781, 0.40670013427734375, 0.4198875427246094, 0.433074951171875, 0.4462623596191406, 0.45944976806640625, 0.4726371765136719, 0.4858245849609375, 0.4990119934082031, 0.5121994018554688, 0.5253868103027344, 0.53857421875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 5.0, 7.0, 6.0, 26.0, 78.0, 232.0, 384.0, 176.0, 57.0, 23.0, 12.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.161806344985962, -3.0679574012756348, -2.9741084575653076, -2.8802595138549805, -2.786410331726074, -2.692561388015747, -2.59871244430542, -2.5048635005950928, -2.4110145568847656, -2.3171656131744385, -2.2233166694641113, -2.129467725753784, -2.035618782043457, -1.9417697191238403, -1.8479206562042236, -1.7540717124938965, -1.6602227687835693, -1.5663738250732422, -1.472524881362915, -1.3786758184432983, -1.2848268747329712, -1.190977931022644, -1.0971288681030273, -1.0032799243927002, -0.909430980682373, -0.8155820369720459, -0.721733033657074, -0.627884030342102, -0.5340350866317749, -0.44018611311912537, -0.34633713960647583, -0.2524881362915039, -0.15863895416259766, -0.06478998064994812, 0.029058992862701416, 0.12290796637535095, 0.2167569398880005, 0.31060591340065, 0.40445488691329956, 0.4983038902282715, 0.5921528339385986, 0.6860017776489258, 0.7798507809638977, 0.8736997842788696, 0.9675487279891968, 1.061397671699524, 1.1552467346191406, 1.2490956783294678, 1.342944622039795, 1.436793565750122, 1.5306425094604492, 1.624491572380066, 1.718340516090393, 1.8121894598007202, 1.906038522720337, 1.999887466430664, 2.093736410140991, 2.1875853538513184, 2.2814342975616455, 2.3752832412719727, 2.469132423400879, 2.562981367111206, 2.656830310821533, 2.7506792545318604, 2.8445281982421875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 0.0, 1.0, 6.0, 4.0, 10.0, 12.0, 16.0, 20.0, 37.0, 44.0, 61.0, 74.0, 59.0, 74.0, 70.0, 77.0, 96.0, 74.0, 62.0, 51.0, 28.0, 34.0, 38.0, 20.0, 11.0, 11.0, 10.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4109008312225342, -1.3583920001983643, -1.3058831691741943, -1.2533743381500244, -1.2008655071258545, -1.1483566761016846, -1.0958478450775146, -1.0433388948440552, -0.9908300638198853, -0.9383212327957153, -0.8858124017715454, -0.8333035707473755, -0.7807946801185608, -0.7282858490943909, -0.675777018070221, -0.6232681274414062, -0.5707593560218811, -0.5182505249977112, -0.46574166417121887, -0.41323283314704895, -0.36072397232055664, -0.3082151412963867, -0.2557063102722168, -0.2031974494457245, -0.15068861842155457, -0.09817977249622345, -0.04567093402147293, 0.006837904453277588, 0.059346750378608704, 0.11185559630393982, 0.16436442732810974, 0.21687328815460205, 0.269382119178772, 0.3218909502029419, 0.3743998110294342, 0.4269086420536041, 0.47941750288009644, 0.5319263339042664, 0.5844351649284363, 0.636944055557251, 0.6894528865814209, 0.7419617176055908, 0.7944705486297607, 0.8469793796539307, 0.8994882702827454, 0.9519971013069153, 1.0045058727264404, 1.0570148229599, 1.1095235347747803, 1.1620323657989502, 1.2145411968231201, 1.26705002784729, 1.31955885887146, 1.3720676898956299, 1.4245765209197998, 1.4770854711532593, 1.5295943021774292, 1.5821031332015991, 1.634611964225769, 1.687120795249939, 1.7396296262741089, 1.7921385765075684, 1.8446474075317383, 1.8971562385559082, 1.9496650695800781]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 7.0, 8.0, 13.0, 13.0, 17.0, 24.0, 33.0, 61.0, 87.0, 174.0, 393.0, 874.0, 2919.0, 21923.0, 929899.0, 84672.0, 4977.0, 1420.0, 466.0, 227.0, 129.0, 72.0, 44.0, 36.0, 25.0, 14.0, 6.0, 5.0, 8.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.412109375, -2.342559814453125, -2.27301025390625, -2.203460693359375, -2.1339111328125, -2.064361572265625, -1.99481201171875, -1.925262451171875, -1.855712890625, -1.786163330078125, -1.71661376953125, -1.647064208984375, -1.5775146484375, -1.507965087890625, -1.43841552734375, -1.368865966796875, -1.29931640625, -1.229766845703125, -1.16021728515625, -1.090667724609375, -1.0211181640625, -0.951568603515625, -0.88201904296875, -0.812469482421875, -0.742919921875, -0.673370361328125, -0.60382080078125, -0.534271240234375, -0.4647216796875, -0.395172119140625, -0.32562255859375, -0.256072998046875, -0.1865234375, -0.116973876953125, -0.04742431640625, 0.022125244140625, 0.0916748046875, 0.161224365234375, 0.23077392578125, 0.300323486328125, 0.369873046875, 0.439422607421875, 0.50897216796875, 0.578521728515625, 0.6480712890625, 0.717620849609375, 0.78717041015625, 0.856719970703125, 0.92626953125, 0.995819091796875, 1.06536865234375, 1.134918212890625, 1.2044677734375, 1.274017333984375, 1.34356689453125, 1.413116455078125, 1.482666015625, 1.552215576171875, 1.62176513671875, 1.691314697265625, 1.7608642578125, 1.830413818359375, 1.89996337890625, 1.969512939453125, 2.0390625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 15.0, 43.0, 98.0, 139.0, 213.0, 218.0, 147.0, 65.0, 33.0, 13.0, 6.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7099609375, -0.6937675476074219, -0.6775741577148438, -0.6613807678222656, -0.6451873779296875, -0.6289939880371094, -0.6128005981445312, -0.5966072082519531, -0.580413818359375, -0.5642204284667969, -0.5480270385742188, -0.5318336486816406, -0.5156402587890625, -0.4994468688964844, -0.48325347900390625, -0.4670600891113281, -0.45086669921875, -0.4346733093261719, -0.41847991943359375, -0.4022865295410156, -0.3860931396484375, -0.3698997497558594, -0.35370635986328125, -0.3375129699707031, -0.321319580078125, -0.3051261901855469, -0.28893280029296875, -0.2727394104003906, -0.2565460205078125, -0.24035263061523438, -0.22415924072265625, -0.20796585083007812, -0.1917724609375, -0.17557907104492188, -0.15938568115234375, -0.14319229125976562, -0.1269989013671875, -0.11080551147460938, -0.09461212158203125, -0.07841873168945312, -0.062225341796875, -0.046031951904296875, -0.02983856201171875, -0.013645172119140625, 0.0025482177734375, 0.018741607666015625, 0.03493499755859375, 0.051128387451171875, 0.06732177734375, 0.08351516723632812, 0.09970855712890625, 0.11590194702148438, 0.1320953369140625, 0.14828872680664062, 0.16448211669921875, 0.18067550659179688, 0.196868896484375, 0.21306228637695312, 0.22925567626953125, 0.24544906616210938, 0.2616424560546875, 0.2778358459472656, 0.29402923583984375, 0.3102226257324219, 0.326416015625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 3.0, 1.0, 0.0, 6.0, 5.0, 13.0, 7.0, 20.0, 24.0, 36.0, 53.0, 88.0, 130.0, 276.0, 756.0, 2182.0, 8570.0, 55370.0, 736635.0, 216026.0, 21710.0, 4267.0, 1322.0, 505.0, 217.0, 120.0, 62.0, 34.0, 26.0, 36.0, 18.0, 11.0, 10.0, 10.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4228515625, -1.3841552734375, -1.345458984375, -1.3067626953125, -1.26806640625, -1.2293701171875, -1.190673828125, -1.1519775390625, -1.11328125, -1.0745849609375, -1.035888671875, -0.9971923828125, -0.95849609375, -0.9197998046875, -0.881103515625, -0.8424072265625, -0.8037109375, -0.7650146484375, -0.726318359375, -0.6876220703125, -0.64892578125, -0.6102294921875, -0.571533203125, -0.5328369140625, -0.494140625, -0.4554443359375, -0.416748046875, -0.3780517578125, -0.33935546875, -0.3006591796875, -0.261962890625, -0.2232666015625, -0.1845703125, -0.1458740234375, -0.107177734375, -0.0684814453125, -0.02978515625, 0.0089111328125, 0.047607421875, 0.0863037109375, 0.125, 0.1636962890625, 0.202392578125, 0.2410888671875, 0.27978515625, 0.3184814453125, 0.357177734375, 0.3958740234375, 0.4345703125, 0.4732666015625, 0.511962890625, 0.5506591796875, 0.58935546875, 0.6280517578125, 0.666748046875, 0.7054443359375, 0.744140625, 0.7828369140625, 0.821533203125, 0.8602294921875, 0.89892578125, 0.9376220703125, 0.976318359375, 1.0150146484375, 1.0537109375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 9.0, 10.0, 8.0, 13.0, 23.0, 16.0, 23.0, 23.0, 21.0, 46.0, 49.0, 46.0, 51.0, 59.0, 84.0, 86.0, 54.0, 63.0, 65.0, 42.0, 37.0, 34.0, 27.0, 29.0, 21.0, 19.0, 13.0, 9.0, 8.0, 7.0, 4.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77490234375, -0.7454910278320312, -0.7160797119140625, -0.6866683959960938, -0.657257080078125, -0.6278457641601562, -0.5984344482421875, -0.5690231323242188, -0.53961181640625, -0.5102005004882812, -0.4807891845703125, -0.45137786865234375, -0.421966552734375, -0.39255523681640625, -0.3631439208984375, -0.33373260498046875, -0.3043212890625, -0.27490997314453125, -0.2454986572265625, -0.21608734130859375, -0.186676025390625, -0.15726470947265625, -0.1278533935546875, -0.09844207763671875, -0.06903076171875, -0.03961944580078125, -0.0102081298828125, 0.01920318603515625, 0.048614501953125, 0.07802581787109375, 0.1074371337890625, 0.13684844970703125, 0.166259765625, 0.19567108154296875, 0.2250823974609375, 0.25449371337890625, 0.283905029296875, 0.31331634521484375, 0.3427276611328125, 0.37213897705078125, 0.40155029296875, 0.43096160888671875, 0.4603729248046875, 0.48978424072265625, 0.519195556640625, 0.5486068725585938, 0.5780181884765625, 0.6074295043945312, 0.6368408203125, 0.6662521362304688, 0.6956634521484375, 0.7250747680664062, 0.754486083984375, 0.7838973999023438, 0.8133087158203125, 0.8427200317382812, 0.87213134765625, 0.9015426635742188, 0.9309539794921875, 0.9603652954101562, 0.989776611328125, 1.0191879272460938, 1.0485992431640625, 1.0780105590820312, 1.107421875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 0.0, 3.0, 10.0, 3.0, 6.0, 16.0, 19.0, 35.0, 67.0, 136.0, 278.0, 759.0, 2383.0, 11664.0, 123056.0, 851382.0, 49440.0, 6720.0, 1596.0, 521.0, 193.0, 86.0, 58.0, 29.0, 30.0, 14.0, 9.0, 6.0, 12.0, 7.0, 3.0, 3.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3359375, -0.3255500793457031, -0.31516265869140625, -0.3047752380371094, -0.2943878173828125, -0.2840003967285156, -0.27361297607421875, -0.2632255554199219, -0.252838134765625, -0.24245071411132812, -0.23206329345703125, -0.22167587280273438, -0.2112884521484375, -0.20090103149414062, -0.19051361083984375, -0.18012619018554688, -0.16973876953125, -0.15935134887695312, -0.14896392822265625, -0.13857650756835938, -0.1281890869140625, -0.11780166625976562, -0.10741424560546875, -0.09702682495117188, -0.086639404296875, -0.07625198364257812, -0.06586456298828125, -0.055477142333984375, -0.0450897216796875, -0.034702301025390625, -0.02431488037109375, -0.013927459716796875, -0.0035400390625, 0.006847381591796875, 0.01723480224609375, 0.027622222900390625, 0.0380096435546875, 0.048397064208984375, 0.05878448486328125, 0.06917190551757812, 0.079559326171875, 0.08994674682617188, 0.10033416748046875, 0.11072158813476562, 0.1211090087890625, 0.13149642944335938, 0.14188385009765625, 0.15227127075195312, 0.16265869140625, 0.17304611206054688, 0.18343353271484375, 0.19382095336914062, 0.2042083740234375, 0.21459579467773438, 0.22498321533203125, 0.23537063598632812, 0.245758056640625, 0.2561454772949219, 0.26653289794921875, 0.2769203186035156, 0.2873077392578125, 0.2976951599121094, 0.30808258056640625, 0.3184700012207031, 0.328857421875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 0.0, 2.0, 2.0, 9.0, 9.0, 8.0, 13.0, 20.0, 17.0, 28.0, 40.0, 47.0, 72.0, 112.0, 107.0, 144.0, 104.0, 87.0, 47.0, 32.0, 22.0, 26.0, 8.0, 7.0, 8.0, 9.0, 5.0, 3.0, 1.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6927719116210938e-05, -1.6219913959503174e-05, -1.551210880279541e-05, -1.4804303646087646e-05, -1.4096498489379883e-05, -1.3388693332672119e-05, -1.2680888175964355e-05, -1.1973083019256592e-05, -1.1265277862548828e-05, -1.0557472705841064e-05, -9.8496675491333e-06, -9.141862392425537e-06, -8.434057235717773e-06, -7.72625207901001e-06, -7.018446922302246e-06, -6.310641765594482e-06, -5.602836608886719e-06, -4.895031452178955e-06, -4.187226295471191e-06, -3.4794211387634277e-06, -2.771615982055664e-06, -2.0638108253479004e-06, -1.3560056686401367e-06, -6.48200511932373e-07, 5.960464477539063e-08, 7.674098014831543e-07, 1.475214958190918e-06, 2.1830201148986816e-06, 2.8908252716064453e-06, 3.598630428314209e-06, 4.306435585021973e-06, 5.014240741729736e-06, 5.7220458984375e-06, 6.429851055145264e-06, 7.137656211853027e-06, 7.845461368560791e-06, 8.553266525268555e-06, 9.261071681976318e-06, 9.968876838684082e-06, 1.0676681995391846e-05, 1.138448715209961e-05, 1.2092292308807373e-05, 1.2800097465515137e-05, 1.35079026222229e-05, 1.4215707778930664e-05, 1.4923512935638428e-05, 1.563131809234619e-05, 1.6339123249053955e-05, 1.704692840576172e-05, 1.7754733562469482e-05, 1.8462538719177246e-05, 1.917034387588501e-05, 1.9878149032592773e-05, 2.0585954189300537e-05, 2.12937593460083e-05, 2.2001564502716064e-05, 2.2709369659423828e-05, 2.3417174816131592e-05, 2.4124979972839355e-05, 2.483278512954712e-05, 2.5540590286254883e-05, 2.6248395442962646e-05, 2.695620059967041e-05, 2.7664005756378174e-05, 2.8371810913085938e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 9.0, 7.0, 7.0, 12.0, 16.0, 26.0, 34.0, 86.0, 161.0, 396.0, 1402.0, 7958.0, 145647.0, 870567.0, 18483.0, 2622.0, 627.0, 240.0, 110.0, 53.0, 22.0, 14.0, 20.0, 10.0, 10.0, 7.0, 4.0, 3.0, 4.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3740234375, -0.3597412109375, -0.345458984375, -0.3311767578125, -0.31689453125, -0.3026123046875, -0.288330078125, -0.2740478515625, -0.259765625, -0.2454833984375, -0.231201171875, -0.2169189453125, -0.20263671875, -0.1883544921875, -0.174072265625, -0.1597900390625, -0.1455078125, -0.1312255859375, -0.116943359375, -0.1026611328125, -0.08837890625, -0.0740966796875, -0.059814453125, -0.0455322265625, -0.03125, -0.0169677734375, -0.002685546875, 0.0115966796875, 0.02587890625, 0.0401611328125, 0.054443359375, 0.0687255859375, 0.0830078125, 0.0972900390625, 0.111572265625, 0.1258544921875, 0.14013671875, 0.1544189453125, 0.168701171875, 0.1829833984375, 0.197265625, 0.2115478515625, 0.225830078125, 0.2401123046875, 0.25439453125, 0.2686767578125, 0.282958984375, 0.2972412109375, 0.3115234375, 0.3258056640625, 0.340087890625, 0.3543701171875, 0.36865234375, 0.3829345703125, 0.397216796875, 0.4114990234375, 0.42578125, 0.4400634765625, 0.454345703125, 0.4686279296875, 0.48291015625, 0.4971923828125, 0.511474609375, 0.5257568359375, 0.5400390625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 0.0, 4.0, 3.0, 3.0, 6.0, 6.0, 8.0, 8.0, 7.0, 15.0, 16.0, 35.0, 45.0, 66.0, 110.0, 138.0, 149.0, 123.0, 66.0, 60.0, 34.0, 23.0, 15.0, 13.0, 10.0, 9.0, 5.0, 4.0, 3.0, 5.0, 4.0, 1.0, 3.0, 4.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16357421875, -0.15757369995117188, -0.15157318115234375, -0.14557266235351562, -0.1395721435546875, -0.13357162475585938, -0.12757110595703125, -0.12157058715820312, -0.115570068359375, -0.10956954956054688, -0.10356903076171875, -0.09756851196289062, -0.0915679931640625, -0.08556747436523438, -0.07956695556640625, -0.07356643676757812, -0.06756591796875, -0.061565399169921875, -0.05556488037109375, -0.049564361572265625, -0.0435638427734375, -0.037563323974609375, -0.03156280517578125, -0.025562286376953125, -0.019561767578125, -0.013561248779296875, -0.00756072998046875, -0.001560211181640625, 0.0044403076171875, 0.010440826416015625, 0.01644134521484375, 0.022441864013671875, 0.0284423828125, 0.034442901611328125, 0.04044342041015625, 0.046443939208984375, 0.0524444580078125, 0.058444976806640625, 0.06444549560546875, 0.07044601440429688, 0.076446533203125, 0.08244705200195312, 0.08844757080078125, 0.09444808959960938, 0.1004486083984375, 0.10644912719726562, 0.11244964599609375, 0.11845016479492188, 0.12445068359375, 0.13045120239257812, 0.13645172119140625, 0.14245223999023438, 0.1484527587890625, 0.15445327758789062, 0.16045379638671875, 0.16645431518554688, 0.172454833984375, 0.17845535278320312, 0.18445587158203125, 0.19045639038085938, 0.1964569091796875, 0.20245742797851562, 0.20845794677734375, 0.21445846557617188, 0.220458984375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 13.0, 65.0, 278.0, 451.0, 142.0, 39.0, 14.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.783329010009766, -21.350446701049805, -20.917564392089844, -20.484683990478516, -20.051801681518555, -19.618919372558594, -19.186037063598633, -18.753154754638672, -18.320274353027344, -17.887392044067383, -17.454509735107422, -17.021629333496094, -16.588747024536133, -16.155864715576172, -15.722982406616211, -15.290101051330566, -14.857217788696289, -14.424335479736328, -13.991454124450684, -13.558571815490723, -13.125690460205078, -12.692808151245117, -12.259925842285156, -11.827044486999512, -11.394163131713867, -10.961280822753906, -10.528399467468262, -10.0955171585083, -9.662635803222656, -9.229753494262695, -8.796871185302734, -8.36398983001709, -7.931107997894287, -7.498226165771484, -7.065344333648682, -6.632462501525879, -6.199580192565918, -5.766698360443115, -5.3338165283203125, -4.900934219360352, -4.468052864074707, -4.035171031951904, -3.6022889614105225, -3.1694071292877197, -2.736525058746338, -2.303643226623535, -1.8707613945007324, -1.4378793239593506, -1.0049972534179688, -0.5721153020858765, -0.13923341035842896, 0.29364848136901855, 0.7265304327011108, 1.1594123840332031, 1.5922942161560059, 2.0251762866973877, 2.4580581188201904, 2.890939950942993, 3.323822021484375, 3.7567038536071777, 4.1895856857299805, 4.622467994689941, 5.055349349975586, 5.488231658935547, 5.92111349105835]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 7.0, 5.0, 3.0, 3.0, 7.0, 9.0, 18.0, 9.0, 14.0, 24.0, 23.0, 34.0, 34.0, 30.0, 34.0, 31.0, 40.0, 36.0, 45.0, 34.0, 52.0, 42.0, 47.0, 34.0, 54.0, 32.0, 37.0, 43.0, 34.0, 34.0, 25.0, 28.0, 22.0, 13.0, 16.0, 13.0, 9.0, 17.0, 3.0, 1.0, 5.0, 5.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.39192008972168, -4.265620231628418, -4.139319896697998, -4.013020038604736, -3.8867197036743164, -3.7604198455810547, -3.634119749069214, -3.507819652557373, -3.3815195560455322, -3.2552194595336914, -3.1289193630218506, -3.0026192665100098, -2.876319408416748, -2.750019073486328, -2.6237192153930664, -2.4974191188812256, -2.3711190223693848, -2.244818925857544, -2.118518829345703, -1.9922188520431519, -1.865918755531311, -1.7396186590194702, -1.613318681716919, -1.4870185852050781, -1.3607184886932373, -1.2344183921813965, -1.1081182956695557, -0.9818183183670044, -0.8555182218551636, -0.7292181253433228, -0.6029180884361267, -0.47661805152893066, -0.35031771659851074, -0.2240176498889923, -0.09771758317947388, 0.028582483530044556, 0.154882550239563, 0.2811826467514038, 0.40748268365859985, 0.5337827205657959, 0.6600828170776367, 0.7863829135894775, 0.9126829504966736, 1.0389829874038696, 1.1652830839157104, 1.2915831804275513, 1.4178831577301025, 1.5441832542419434, 1.6704833507537842, 1.796783447265625, 1.9230835437774658, 2.0493836402893066, 2.1756834983825684, 2.3019838333129883, 2.42828369140625, 2.554583787918091, 2.6808838844299316, 2.8071839809417725, 2.9334840774536133, 3.059784173965454, 3.186084270477295, 3.3123841285705566, 3.4386842250823975, 3.5649843215942383, 3.691284418106079]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 4.0, 9.0, 11.0, 15.0, 10.0, 26.0, 25.0, 31.0, 48.0, 67.0, 83.0, 141.0, 232.0, 415.0, 907.0, 2314.0, 8263.0, 67130.0, 4062687.0, 42200.0, 6460.0, 1863.0, 702.0, 288.0, 146.0, 80.0, 37.0, 32.0, 17.0, 9.0, 10.0, 7.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.4609375, -1.42803955078125, -1.3951416015625, -1.36224365234375, -1.329345703125, -1.29644775390625, -1.2635498046875, -1.23065185546875, -1.19775390625, -1.16485595703125, -1.1319580078125, -1.09906005859375, -1.066162109375, -1.03326416015625, -1.0003662109375, -0.96746826171875, -0.9345703125, -0.90167236328125, -0.8687744140625, -0.83587646484375, -0.802978515625, -0.77008056640625, -0.7371826171875, -0.70428466796875, -0.67138671875, -0.63848876953125, -0.6055908203125, -0.57269287109375, -0.539794921875, -0.50689697265625, -0.4739990234375, -0.44110107421875, -0.408203125, -0.37530517578125, -0.3424072265625, -0.30950927734375, -0.276611328125, -0.24371337890625, -0.2108154296875, -0.17791748046875, -0.14501953125, -0.11212158203125, -0.0792236328125, -0.04632568359375, -0.013427734375, 0.01947021484375, 0.0523681640625, 0.08526611328125, 0.1181640625, 0.15106201171875, 0.1839599609375, 0.21685791015625, 0.249755859375, 0.28265380859375, 0.3155517578125, 0.34844970703125, 0.38134765625, 0.41424560546875, 0.4471435546875, 0.48004150390625, 0.512939453125, 0.54583740234375, 0.5787353515625, 0.61163330078125, 0.64453125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 6.0, 18.0, 41.0, 75.0, 127.0, 169.0, 184.0, 146.0, 116.0, 67.0, 24.0, 15.0, 7.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.75537109375, -0.7386932373046875, -0.722015380859375, -0.7053375244140625, -0.68865966796875, -0.6719818115234375, -0.655303955078125, -0.6386260986328125, -0.6219482421875, -0.6052703857421875, -0.588592529296875, -0.5719146728515625, -0.55523681640625, -0.5385589599609375, -0.521881103515625, -0.5052032470703125, -0.488525390625, -0.4718475341796875, -0.455169677734375, -0.4384918212890625, -0.42181396484375, -0.4051361083984375, -0.388458251953125, -0.3717803955078125, -0.3551025390625, -0.3384246826171875, -0.321746826171875, -0.3050689697265625, -0.28839111328125, -0.2717132568359375, -0.255035400390625, -0.2383575439453125, -0.2216796875, -0.2050018310546875, -0.188323974609375, -0.1716461181640625, -0.15496826171875, -0.1382904052734375, -0.121612548828125, -0.1049346923828125, -0.0882568359375, -0.0715789794921875, -0.054901123046875, -0.0382232666015625, -0.02154541015625, -0.0048675537109375, 0.011810302734375, 0.0284881591796875, 0.045166015625, 0.0618438720703125, 0.078521728515625, 0.0951995849609375, 0.11187744140625, 0.1285552978515625, 0.145233154296875, 0.1619110107421875, 0.1785888671875, 0.1952667236328125, 0.211944580078125, 0.2286224365234375, 0.24530029296875, 0.2619781494140625, 0.278656005859375, 0.2953338623046875, 0.31201171875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 1.0, 4.0, 7.0, 14.0, 23.0, 54.0, 120.0, 260.0, 666.0, 1587.0, 3657.0, 11130.0, 57778.0, 3978020.0, 115552.0, 16466.0, 5120.0, 2133.0, 926.0, 421.0, 176.0, 73.0, 29.0, 20.0, 7.0, 8.0, 3.0, 3.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.96533203125, -0.9374618530273438, -0.9095916748046875, -0.8817214965820312, -0.853851318359375, -0.8259811401367188, -0.7981109619140625, -0.7702407836914062, -0.74237060546875, -0.7145004272460938, -0.6866302490234375, -0.6587600708007812, -0.630889892578125, -0.6030197143554688, -0.5751495361328125, -0.5472793579101562, -0.5194091796875, -0.49153900146484375, -0.4636688232421875, -0.43579864501953125, -0.407928466796875, -0.38005828857421875, -0.3521881103515625, -0.32431793212890625, -0.29644775390625, -0.26857757568359375, -0.2407073974609375, -0.21283721923828125, -0.184967041015625, -0.15709686279296875, -0.1292266845703125, -0.10135650634765625, -0.073486328125, -0.04561614990234375, -0.0177459716796875, 0.01012420654296875, 0.037994384765625, 0.06586456298828125, 0.0937347412109375, 0.12160491943359375, 0.14947509765625, 0.17734527587890625, 0.2052154541015625, 0.23308563232421875, 0.260955810546875, 0.28882598876953125, 0.3166961669921875, 0.34456634521484375, 0.3724365234375, 0.40030670166015625, 0.4281768798828125, 0.45604705810546875, 0.483917236328125, 0.5117874145507812, 0.5396575927734375, 0.5675277709960938, 0.59539794921875, 0.6232681274414062, 0.6511383056640625, 0.6790084838867188, 0.706878662109375, 0.7347488403320312, 0.7626190185546875, 0.7904891967773438, 0.818359375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 3.0, 5.0, 9.0, 14.0, 28.0, 16.0, 27.0, 64.0, 108.0, 302.0, 2960.0, 264.0, 93.0, 37.0, 29.0, 21.0, 15.0, 17.0, 11.0, 8.0, 2.0, 7.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.256591796875, -0.24819183349609375, -0.2397918701171875, -0.23139190673828125, -0.222991943359375, -0.21459197998046875, -0.2061920166015625, -0.19779205322265625, -0.18939208984375, -0.18099212646484375, -0.1725921630859375, -0.16419219970703125, -0.155792236328125, -0.14739227294921875, -0.1389923095703125, -0.13059234619140625, -0.1221923828125, -0.11379241943359375, -0.1053924560546875, -0.09699249267578125, -0.088592529296875, -0.08019256591796875, -0.0717926025390625, -0.06339263916015625, -0.05499267578125, -0.04659271240234375, -0.0381927490234375, -0.02979278564453125, -0.021392822265625, -0.01299285888671875, -0.0045928955078125, 0.00380706787109375, 0.01220703125, 0.02060699462890625, 0.0290069580078125, 0.03740692138671875, 0.045806884765625, 0.05420684814453125, 0.0626068115234375, 0.07100677490234375, 0.07940673828125, 0.08780670166015625, 0.0962066650390625, 0.10460662841796875, 0.113006591796875, 0.12140655517578125, 0.1298065185546875, 0.13820648193359375, 0.1466064453125, 0.15500640869140625, 0.1634063720703125, 0.17180633544921875, 0.180206298828125, 0.18860626220703125, 0.1970062255859375, 0.20540618896484375, 0.21380615234375, 0.22220611572265625, 0.2306060791015625, 0.23900604248046875, 0.247406005859375, 0.25580596923828125, 0.2642059326171875, 0.27260589599609375, 0.281005859375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 10.0, 18.0, 25.0, 78.0, 225.0, 342.0, 199.0, 72.0, 18.0, 8.0, 6.0, 5.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5095571279525757, -1.4336057901382446, -1.3576544523239136, -1.2817031145095825, -1.205751657485962, -1.1298003196716309, -1.0538489818572998, -0.9778976440429688, -0.9019463062286377, -0.8259949684143066, -0.7500436305999756, -0.6740922331809998, -0.5981408953666687, -0.5221895575523376, -0.4462381899356842, -0.37028682231903076, -0.2943354845046997, -0.21838413178920746, -0.1424327790737152, -0.06648142635822296, 0.009469926357269287, 0.08542126417160034, 0.16137263178825378, 0.23732399940490723, 0.3132753372192383, 0.38922667503356934, 0.4651780426502228, 0.5411294102668762, 0.6170807480812073, 0.6930320858955383, 0.7689834833145142, 0.8449348211288452, 0.9208860397338867, 0.9968373775482178, 1.0727887153625488, 1.1487400531768799, 1.224691390991211, 1.300642728805542, 1.3765941858291626, 1.4525455236434937, 1.5284968614578247, 1.6044481992721558, 1.6803995370864868, 1.7563508749008179, 1.8323023319244385, 1.9082536697387695, 1.9842050075531006, 2.0601563453674316, 2.1361076831817627, 2.2120590209960938, 2.288010358810425, 2.363961696624756, 2.439913034439087, 2.515864372253418, 2.591815710067749, 2.66776704788208, 2.7437186241149902, 2.8196699619293213, 2.8956212997436523, 2.9715726375579834, 3.0475239753723145, 3.1234753131866455, 3.1994266510009766, 3.2753782272338867, 3.3513293266296387]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 7.0, 3.0, 6.0, 8.0, 19.0, 19.0, 47.0, 40.0, 49.0, 59.0, 57.0, 65.0, 65.0, 90.0, 79.0, 64.0, 74.0, 59.0, 37.0, 45.0, 27.0, 18.0, 15.0, 14.0, 11.0, 9.0, 7.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.409222960472107, -1.3669484853744507, -1.3246738910675049, -1.2823994159698486, -1.2401249408721924, -1.1978504657745361, -1.1555758714675903, -1.113301396369934, -1.0710268020629883, -1.028752326965332, -0.986477792263031, -0.94420325756073, -0.9019287824630737, -0.8596542477607727, -0.8173797130584717, -0.7751052379608154, -0.7328307628631592, -0.6905562281608582, -0.6482817530632019, -0.6060072183609009, -0.5637327432632446, -0.5214582085609436, -0.4791836738586426, -0.43690916895866394, -0.3946346640586853, -0.35236015915870667, -0.310085654258728, -0.267811119556427, -0.22553661465644836, -0.18326210975646973, -0.1409875750541687, -0.09871307015419006, -0.05643868446350098, -0.014164172112941742, 0.028110340237617493, 0.07038486003875732, 0.11265936493873596, 0.1549338698387146, 0.19720840454101562, 0.23948290944099426, 0.2817574143409729, 0.32403191924095154, 0.3663064241409302, 0.4085809588432312, 0.45085546374320984, 0.4931299686431885, 0.5354045033454895, 0.5776790380477905, 0.6199535131454468, 0.6622280478477478, 0.704502522945404, 0.7467770576477051, 0.7890515327453613, 0.8313260674476624, 0.8736006021499634, 0.9158750772476196, 0.9581496119499207, 1.0004241466522217, 1.042698621749878, 1.0849730968475342, 1.12724769115448, 1.1695221662521362, 1.211796760559082, 1.2540712356567383, 1.2963457107543945]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 7.0, 3.0, 7.0, 4.0, 9.0, 15.0, 19.0, 21.0, 23.0, 38.0, 55.0, 129.0, 259.0, 525.0, 1215.0, 4196.0, 42626.0, 887011.0, 102476.0, 6845.0, 1667.0, 660.0, 346.0, 156.0, 85.0, 48.0, 29.0, 28.0, 12.0, 13.0, 7.0, 9.0, 8.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.271484375, -2.21417236328125, -2.1568603515625, -2.09954833984375, -2.042236328125, -1.98492431640625, -1.9276123046875, -1.87030029296875, -1.81298828125, -1.75567626953125, -1.6983642578125, -1.64105224609375, -1.583740234375, -1.52642822265625, -1.4691162109375, -1.41180419921875, -1.3544921875, -1.29718017578125, -1.2398681640625, -1.18255615234375, -1.125244140625, -1.06793212890625, -1.0106201171875, -0.95330810546875, -0.89599609375, -0.83868408203125, -0.7813720703125, -0.72406005859375, -0.666748046875, -0.60943603515625, -0.5521240234375, -0.49481201171875, -0.4375, -0.38018798828125, -0.3228759765625, -0.26556396484375, -0.208251953125, -0.15093994140625, -0.0936279296875, -0.03631591796875, 0.02099609375, 0.07830810546875, 0.1356201171875, 0.19293212890625, 0.250244140625, 0.30755615234375, 0.3648681640625, 0.42218017578125, 0.4794921875, 0.53680419921875, 0.5941162109375, 0.65142822265625, 0.708740234375, 0.76605224609375, 0.8233642578125, 0.88067626953125, 0.93798828125, 0.99530029296875, 1.0526123046875, 1.10992431640625, 1.167236328125, 1.22454833984375, 1.2818603515625, 1.33917236328125, 1.396484375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 10.0, 34.0, 58.0, 85.0, 165.0, 167.0, 160.0, 131.0, 91.0, 52.0, 21.0, 10.0, 7.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.73486328125, -0.7188224792480469, -0.7027816772460938, -0.6867408752441406, -0.6707000732421875, -0.6546592712402344, -0.6386184692382812, -0.6225776672363281, -0.606536865234375, -0.5904960632324219, -0.5744552612304688, -0.5584144592285156, -0.5423736572265625, -0.5263328552246094, -0.5102920532226562, -0.4942512512207031, -0.47821044921875, -0.4621696472167969, -0.44612884521484375, -0.4300880432128906, -0.4140472412109375, -0.3980064392089844, -0.38196563720703125, -0.3659248352050781, -0.349884033203125, -0.3338432312011719, -0.31780242919921875, -0.3017616271972656, -0.2857208251953125, -0.2696800231933594, -0.25363922119140625, -0.23759841918945312, -0.2215576171875, -0.20551681518554688, -0.18947601318359375, -0.17343521118164062, -0.1573944091796875, -0.14135360717773438, -0.12531280517578125, -0.10927200317382812, -0.093231201171875, -0.07719039916992188, -0.06114959716796875, -0.045108795166015625, -0.0290679931640625, -0.013027191162109375, 0.00301361083984375, 0.019054412841796875, 0.03509521484375, 0.051136016845703125, 0.06717681884765625, 0.08321762084960938, 0.0992584228515625, 0.11529922485351562, 0.13134002685546875, 0.14738082885742188, 0.163421630859375, 0.17946243286132812, 0.19550323486328125, 0.21154403686523438, 0.2275848388671875, 0.24362564086914062, 0.25966644287109375, 0.2757072448730469, 0.291748046875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 2.0, 9.0, 19.0, 14.0, 12.0, 23.0, 29.0, 48.0, 64.0, 94.0, 194.0, 413.0, 1113.0, 3450.0, 13706.0, 87596.0, 759456.0, 154933.0, 20334.0, 4593.0, 1352.0, 516.0, 213.0, 108.0, 67.0, 45.0, 36.0, 22.0, 31.0, 11.0, 10.0, 8.0, 5.0, 3.0, 4.0, 6.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.0498046875, -1.01312255859375, -0.9764404296875, -0.93975830078125, -0.903076171875, -0.86639404296875, -0.8297119140625, -0.79302978515625, -0.75634765625, -0.71966552734375, -0.6829833984375, -0.64630126953125, -0.609619140625, -0.57293701171875, -0.5362548828125, -0.49957275390625, -0.462890625, -0.42620849609375, -0.3895263671875, -0.35284423828125, -0.316162109375, -0.27947998046875, -0.2427978515625, -0.20611572265625, -0.16943359375, -0.13275146484375, -0.0960693359375, -0.05938720703125, -0.022705078125, 0.01397705078125, 0.0506591796875, 0.08734130859375, 0.1240234375, 0.16070556640625, 0.1973876953125, 0.23406982421875, 0.270751953125, 0.30743408203125, 0.3441162109375, 0.38079833984375, 0.41748046875, 0.45416259765625, 0.4908447265625, 0.52752685546875, 0.564208984375, 0.60089111328125, 0.6375732421875, 0.67425537109375, 0.7109375, 0.74761962890625, 0.7843017578125, 0.82098388671875, 0.857666015625, 0.89434814453125, 0.9310302734375, 0.96771240234375, 1.00439453125, 1.04107666015625, 1.0777587890625, 1.11444091796875, 1.151123046875, 1.18780517578125, 1.2244873046875, 1.26116943359375, 1.2978515625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 5.0, 4.0, 6.0, 2.0, 9.0, 15.0, 24.0, 16.0, 28.0, 22.0, 27.0, 33.0, 45.0, 37.0, 55.0, 54.0, 51.0, 45.0, 56.0, 67.0, 61.0, 57.0, 52.0, 37.0, 31.0, 34.0, 27.0, 21.0, 13.0, 13.0, 9.0, 14.0, 11.0, 4.0, 1.0, 3.0, 3.0, 1.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.94091796875, -0.9139404296875, -0.886962890625, -0.8599853515625, -0.8330078125, -0.8060302734375, -0.779052734375, -0.7520751953125, -0.72509765625, -0.6981201171875, -0.671142578125, -0.6441650390625, -0.6171875, -0.5902099609375, -0.563232421875, -0.5362548828125, -0.50927734375, -0.4822998046875, -0.455322265625, -0.4283447265625, -0.4013671875, -0.3743896484375, -0.347412109375, -0.3204345703125, -0.29345703125, -0.2664794921875, -0.239501953125, -0.2125244140625, -0.185546875, -0.1585693359375, -0.131591796875, -0.1046142578125, -0.07763671875, -0.0506591796875, -0.023681640625, 0.0032958984375, 0.0302734375, 0.0572509765625, 0.084228515625, 0.1112060546875, 0.13818359375, 0.1651611328125, 0.192138671875, 0.2191162109375, 0.24609375, 0.2730712890625, 0.300048828125, 0.3270263671875, 0.35400390625, 0.3809814453125, 0.407958984375, 0.4349365234375, 0.4619140625, 0.4888916015625, 0.515869140625, 0.5428466796875, 0.56982421875, 0.5968017578125, 0.623779296875, 0.6507568359375, 0.677734375, 0.7047119140625, 0.731689453125, 0.7586669921875, 0.78564453125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 6.0, 6.0, 3.0, 12.0, 19.0, 23.0, 39.0, 55.0, 99.0, 188.0, 492.0, 2039.0, 13718.0, 441339.0, 571901.0, 15451.0, 2163.0, 553.0, 207.0, 99.0, 52.0, 40.0, 13.0, 7.0, 9.0, 6.0, 3.0, 7.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.468017578125, -0.4485359191894531, -0.42905426025390625, -0.4095726013183594, -0.3900909423828125, -0.3706092834472656, -0.35112762451171875, -0.3316459655761719, -0.312164306640625, -0.2926826477050781, -0.27320098876953125, -0.2537193298339844, -0.2342376708984375, -0.21475601196289062, -0.19527435302734375, -0.17579269409179688, -0.15631103515625, -0.13682937622070312, -0.11734771728515625, -0.09786605834960938, -0.0783843994140625, -0.058902740478515625, -0.03942108154296875, -0.019939422607421875, -0.000457763671875, 0.019023895263671875, 0.03850555419921875, 0.057987213134765625, 0.0774688720703125, 0.09695053100585938, 0.11643218994140625, 0.13591384887695312, 0.1553955078125, 0.17487716674804688, 0.19435882568359375, 0.21384048461914062, 0.2333221435546875, 0.2528038024902344, 0.27228546142578125, 0.2917671203613281, 0.311248779296875, 0.3307304382324219, 0.35021209716796875, 0.3696937561035156, 0.3891754150390625, 0.4086570739746094, 0.42813873291015625, 0.4476203918457031, 0.46710205078125, 0.4865837097167969, 0.5060653686523438, 0.5255470275878906, 0.5450286865234375, 0.5645103454589844, 0.5839920043945312, 0.6034736633300781, 0.622955322265625, 0.6424369812011719, 0.6619186401367188, 0.6814002990722656, 0.7008819580078125, 0.7203636169433594, 0.7398452758789062, 0.7593269348144531, 0.77880859375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 0.0, 5.0, 5.0, 13.0, 18.0, 24.0, 44.0, 131.0, 377.0, 217.0, 77.0, 38.0, 18.0, 17.0, 8.0, 8.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2067298889160156e-05, -2.9535964131355286e-05, -2.7004629373550415e-05, -2.4473294615745544e-05, -2.1941959857940674e-05, -1.9410625100135803e-05, -1.6879290342330933e-05, -1.4347955584526062e-05, -1.1816620826721191e-05, -9.28528606891632e-06, -6.75395131111145e-06, -4.22261655330658e-06, -1.691281795501709e-06, 8.400529623031616e-07, 3.3713877201080322e-06, 5.902722477912903e-06, 8.434057235717773e-06, 1.0965391993522644e-05, 1.3496726751327515e-05, 1.6028061509132385e-05, 1.8559396266937256e-05, 2.1090731024742126e-05, 2.3622065782546997e-05, 2.6153400540351868e-05, 2.8684735298156738e-05, 3.121607005596161e-05, 3.374740481376648e-05, 3.627873957157135e-05, 3.881007432937622e-05, 4.134140908718109e-05, 4.387274384498596e-05, 4.640407860279083e-05, 4.89354133605957e-05, 5.1466748118400574e-05, 5.3998082876205444e-05, 5.6529417634010315e-05, 5.9060752391815186e-05, 6.159208714962006e-05, 6.412342190742493e-05, 6.66547566652298e-05, 6.918609142303467e-05, 7.171742618083954e-05, 7.424876093864441e-05, 7.678009569644928e-05, 7.931143045425415e-05, 8.184276521205902e-05, 8.437409996986389e-05, 8.690543472766876e-05, 8.943676948547363e-05, 9.19681042432785e-05, 9.449943900108337e-05, 9.703077375888824e-05, 9.956210851669312e-05, 0.00010209344327449799, 0.00010462477803230286, 0.00010715611279010773, 0.0001096874475479126, 0.00011221878230571747, 0.00011475011706352234, 0.00011728145182132721, 0.00011981278657913208, 0.00012234412133693695, 0.00012487545609474182, 0.0001274067908525467, 0.00012993812561035156]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 2.0, 12.0, 28.0, 58.0, 93.0, 198.0, 616.0, 5950.0, 958701.0, 80393.0, 1902.0, 348.0, 125.0, 48.0, 43.0, 21.0, 10.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75390625, -0.719329833984375, -0.68475341796875, -0.650177001953125, -0.6156005859375, -0.581024169921875, -0.54644775390625, -0.511871337890625, -0.477294921875, -0.442718505859375, -0.40814208984375, -0.373565673828125, -0.3389892578125, -0.304412841796875, -0.26983642578125, -0.235260009765625, -0.20068359375, -0.166107177734375, -0.13153076171875, -0.096954345703125, -0.0623779296875, -0.027801513671875, 0.00677490234375, 0.041351318359375, 0.075927734375, 0.110504150390625, 0.14508056640625, 0.179656982421875, 0.2142333984375, 0.248809814453125, 0.28338623046875, 0.317962646484375, 0.3525390625, 0.387115478515625, 0.42169189453125, 0.456268310546875, 0.4908447265625, 0.525421142578125, 0.55999755859375, 0.594573974609375, 0.629150390625, 0.663726806640625, 0.69830322265625, 0.732879638671875, 0.7674560546875, 0.802032470703125, 0.83660888671875, 0.871185302734375, 0.90576171875, 0.940338134765625, 0.97491455078125, 1.009490966796875, 1.0440673828125, 1.078643798828125, 1.11322021484375, 1.147796630859375, 1.182373046875, 1.216949462890625, 1.25152587890625, 1.286102294921875, 1.3206787109375, 1.355255126953125, 1.38983154296875, 1.424407958984375, 1.458984375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 8.0, 3.0, 14.0, 30.0, 54.0, 108.0, 241.0, 288.0, 148.0, 49.0, 20.0, 15.0, 13.0, 9.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95166015625, -0.9326629638671875, -0.913665771484375, -0.8946685791015625, -0.87567138671875, -0.8566741943359375, -0.837677001953125, -0.8186798095703125, -0.7996826171875, -0.7806854248046875, -0.761688232421875, -0.7426910400390625, -0.72369384765625, -0.7046966552734375, -0.685699462890625, -0.6667022705078125, -0.647705078125, -0.6287078857421875, -0.609710693359375, -0.5907135009765625, -0.57171630859375, -0.5527191162109375, -0.533721923828125, -0.5147247314453125, -0.4957275390625, -0.4767303466796875, -0.457733154296875, -0.4387359619140625, -0.41973876953125, -0.4007415771484375, -0.381744384765625, -0.3627471923828125, -0.34375, -0.3247528076171875, -0.305755615234375, -0.2867584228515625, -0.26776123046875, -0.2487640380859375, -0.229766845703125, -0.2107696533203125, -0.1917724609375, -0.1727752685546875, -0.153778076171875, -0.1347808837890625, -0.11578369140625, -0.0967864990234375, -0.077789306640625, -0.0587921142578125, -0.039794921875, -0.0207977294921875, -0.001800537109375, 0.0171966552734375, 0.03619384765625, 0.0551910400390625, 0.074188232421875, 0.0931854248046875, 0.1121826171875, 0.1311798095703125, 0.150177001953125, 0.1691741943359375, 0.18817138671875, 0.2071685791015625, 0.226165771484375, 0.2451629638671875, 0.26416015625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 20.0, 49.0, 98.0, 268.0, 320.0, 139.0, 58.0, 28.0, 13.0, 4.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.300485610961914, -12.002562522888184, -11.704639434814453, -11.406717300415039, -11.108794212341309, -10.810871124267578, -10.512948989868164, -10.215025901794434, -9.917102813720703, -9.619179725646973, -9.321256637573242, -9.023334503173828, -8.725411415100098, -8.427488327026367, -8.129566192626953, -7.831643104553223, -7.533720016479492, -7.235796928405762, -6.9378743171691895, -6.639951705932617, -6.342028617858887, -6.044105529785156, -5.746182918548584, -5.448260307312012, -5.150337219238281, -4.852414131164551, -4.5544915199279785, -4.256568908691406, -3.958645820617676, -3.6607229709625244, -3.362800121307373, -3.0648772716522217, -2.766953945159912, -2.4690310955047607, -2.1711082458496094, -1.873185396194458, -1.5752625465393066, -1.2773396968841553, -0.9794168472290039, -0.6814939975738525, -0.38357114791870117, -0.0856482982635498, 0.21227455139160156, 0.5101974010467529, 0.8081202507019043, 1.1060431003570557, 1.403965950012207, 1.7018887996673584, 1.9998116493225098, 2.297734498977661, 2.5956573486328125, 2.893580198287964, 3.1915030479431152, 3.4894258975982666, 3.787348747253418, 4.085271835327148, 4.383194446563721, 4.681117057800293, 4.979040145874023, 5.276963233947754, 5.574885845184326, 5.872808456420898, 6.170731544494629, 6.468654632568359, 6.766577243804932]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 7.0, 1.0, 6.0, 9.0, 15.0, 14.0, 4.0, 13.0, 12.0, 18.0, 23.0, 23.0, 21.0, 33.0, 23.0, 32.0, 44.0, 43.0, 37.0, 41.0, 34.0, 36.0, 37.0, 37.0, 39.0, 41.0, 38.0, 34.0, 33.0, 32.0, 29.0, 26.0, 38.0, 24.0, 12.0, 14.0, 18.0, 5.0, 11.0, 11.0, 12.0, 8.0, 6.0, 4.0, 3.0, 1.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.060755968093872, -2.9560089111328125, -2.851261615753174, -2.7465145587921143, -2.6417675018310547, -2.537020206451416, -2.4322731494903564, -2.327526092529297, -2.222778797149658, -2.1180317401885986, -2.01328444480896, -1.9085373878479004, -1.8037902116775513, -1.6990430355072021, -1.5942959785461426, -1.4895488023757935, -1.3848016262054443, -1.2800544500350952, -1.175307273864746, -1.0705602169036865, -0.9658130407333374, -0.8610658645629883, -0.7563187479972839, -0.6515716314315796, -0.5468244552612305, -0.44207730889320374, -0.337330162525177, -0.23258301615715027, -0.12783586978912354, -0.023088693618774414, 0.08165842294692993, 0.18640553951263428, 0.2911524772644043, 0.39589962363243103, 0.5006467700004578, 0.6053938865661621, 0.7101410627365112, 0.8148882389068604, 0.9196353554725647, 1.024382472038269, 1.1291296482086182, 1.2338768243789673, 1.3386240005493164, 1.443371057510376, 1.548118233680725, 1.6528654098510742, 1.7576124668121338, 1.862359642982483, 1.967106819152832, 2.0718538761138916, 2.1766011714935303, 2.28134822845459, 2.3860955238342285, 2.490842580795288, 2.5955896377563477, 2.7003369331359863, 2.805083990097046, 2.9098310470581055, 3.014578342437744, 3.1193253993988037, 3.2240724563598633, 3.328819751739502, 3.4335668087005615, 3.538313865661621, 3.6430611610412598]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 11.0, 5.0, 7.0, 7.0, 11.0, 15.0, 10.0, 34.0, 48.0, 102.0, 205.0, 426.0, 1105.0, 4347.0, 75013.0, 4100315.0, 9852.0, 1778.0, 546.0, 229.0, 104.0, 44.0, 32.0, 13.0, 8.0, 3.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0], "bins": [-5.0859375, -4.9781951904296875, -4.870452880859375, -4.7627105712890625, -4.65496826171875, -4.5472259521484375, -4.439483642578125, -4.3317413330078125, -4.2239990234375, -4.1162567138671875, -4.008514404296875, -3.9007720947265625, -3.79302978515625, -3.6852874755859375, -3.577545166015625, -3.4698028564453125, -3.362060546875, -3.2543182373046875, -3.146575927734375, -3.0388336181640625, -2.93109130859375, -2.8233489990234375, -2.715606689453125, -2.6078643798828125, -2.5001220703125, -2.3923797607421875, -2.284637451171875, -2.1768951416015625, -2.06915283203125, -1.9614105224609375, -1.853668212890625, -1.7459259033203125, -1.63818359375, -1.5304412841796875, -1.422698974609375, -1.3149566650390625, -1.20721435546875, -1.0994720458984375, -0.991729736328125, -0.8839874267578125, -0.7762451171875, -0.6685028076171875, -0.560760498046875, -0.4530181884765625, -0.34527587890625, -0.2375335693359375, -0.129791259765625, -0.0220489501953125, 0.085693359375, 0.1934356689453125, 0.301177978515625, 0.4089202880859375, 0.51666259765625, 0.6244049072265625, 0.732147216796875, 0.8398895263671875, 0.9476318359375, 1.0553741455078125, 1.163116455078125, 1.2708587646484375, 1.37860107421875, 1.4863433837890625, 1.594085693359375, 1.7018280029296875, 1.8095703125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 16.0, 26.0, 43.0, 79.0, 107.0, 144.0, 154.0, 133.0, 118.0, 85.0, 42.0, 24.0, 13.0, 10.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.759765625, -0.7434196472167969, -0.7270736694335938, -0.7107276916503906, -0.6943817138671875, -0.6780357360839844, -0.6616897583007812, -0.6453437805175781, -0.628997802734375, -0.6126518249511719, -0.5963058471679688, -0.5799598693847656, -0.5636138916015625, -0.5472679138183594, -0.5309219360351562, -0.5145759582519531, -0.49822998046875, -0.4818840026855469, -0.46553802490234375, -0.4491920471191406, -0.4328460693359375, -0.4165000915527344, -0.40015411376953125, -0.3838081359863281, -0.367462158203125, -0.3511161804199219, -0.33477020263671875, -0.3184242248535156, -0.3020782470703125, -0.2857322692871094, -0.26938629150390625, -0.2530403137207031, -0.2366943359375, -0.22034835815429688, -0.20400238037109375, -0.18765640258789062, -0.1713104248046875, -0.15496444702148438, -0.13861846923828125, -0.12227249145507812, -0.105926513671875, -0.08958053588867188, -0.07323455810546875, -0.056888580322265625, -0.0405426025390625, -0.024196624755859375, -0.00785064697265625, 0.008495330810546875, 0.02484130859375, 0.041187286376953125, 0.05753326416015625, 0.07387924194335938, 0.0902252197265625, 0.10657119750976562, 0.12291717529296875, 0.13926315307617188, 0.155609130859375, 0.17195510864257812, 0.18830108642578125, 0.20464706420898438, 0.2209930419921875, 0.23733901977539062, 0.25368499755859375, 0.2700309753417969, 0.286376953125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 8.0, 5.0, 4.0, 5.0, 9.0, 18.0, 23.0, 35.0, 49.0, 98.0, 133.0, 209.0, 397.0, 695.0, 1558.0, 3836.0, 11837.0, 54698.0, 3874788.0, 208041.0, 25037.0, 7281.0, 2753.0, 1226.0, 582.0, 361.0, 217.0, 150.0, 96.0, 42.0, 42.0, 18.0, 14.0, 8.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.33203125, -1.2947845458984375, -1.257537841796875, -1.2202911376953125, -1.18304443359375, -1.1457977294921875, -1.108551025390625, -1.0713043212890625, -1.0340576171875, -0.9968109130859375, -0.959564208984375, -0.9223175048828125, -0.88507080078125, -0.8478240966796875, -0.810577392578125, -0.7733306884765625, -0.736083984375, -0.6988372802734375, -0.661590576171875, -0.6243438720703125, -0.58709716796875, -0.5498504638671875, -0.512603759765625, -0.4753570556640625, -0.4381103515625, -0.4008636474609375, -0.363616943359375, -0.3263702392578125, -0.28912353515625, -0.2518768310546875, -0.214630126953125, -0.1773834228515625, -0.14013671875, -0.1028900146484375, -0.065643310546875, -0.0283966064453125, 0.00885009765625, 0.0460968017578125, 0.083343505859375, 0.1205902099609375, 0.1578369140625, 0.1950836181640625, 0.232330322265625, 0.2695770263671875, 0.30682373046875, 0.3440704345703125, 0.381317138671875, 0.4185638427734375, 0.455810546875, 0.4930572509765625, 0.530303955078125, 0.5675506591796875, 0.60479736328125, 0.6420440673828125, 0.679290771484375, 0.7165374755859375, 0.7537841796875, 0.7910308837890625, 0.828277587890625, 0.8655242919921875, 0.90277099609375, 0.9400177001953125, 0.977264404296875, 1.0145111083984375, 1.0517578125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 9.0, 9.0, 19.0, 23.0, 33.0, 63.0, 123.0, 769.0, 2628.0, 153.0, 66.0, 48.0, 33.0, 18.0, 12.0, 14.0, 11.0, 8.0, 6.0, 5.0, 6.0, 5.0, 1.0, 0.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.35498046875, -0.34137725830078125, -0.3277740478515625, -0.31417083740234375, -0.300567626953125, -0.28696441650390625, -0.2733612060546875, -0.25975799560546875, -0.24615478515625, -0.23255157470703125, -0.2189483642578125, -0.20534515380859375, -0.191741943359375, -0.17813873291015625, -0.1645355224609375, -0.15093231201171875, -0.1373291015625, -0.12372589111328125, -0.1101226806640625, -0.09651947021484375, -0.082916259765625, -0.06931304931640625, -0.0557098388671875, -0.04210662841796875, -0.02850341796875, -0.01490020751953125, -0.0012969970703125, 0.01230621337890625, 0.025909423828125, 0.03951263427734375, 0.0531158447265625, 0.06671905517578125, 0.080322265625, 0.09392547607421875, 0.1075286865234375, 0.12113189697265625, 0.134735107421875, 0.14833831787109375, 0.1619415283203125, 0.17554473876953125, 0.18914794921875, 0.20275115966796875, 0.2163543701171875, 0.22995758056640625, 0.243560791015625, 0.25716400146484375, 0.2707672119140625, 0.28437042236328125, 0.2979736328125, 0.31157684326171875, 0.3251800537109375, 0.33878326416015625, 0.352386474609375, 0.36598968505859375, 0.3795928955078125, 0.39319610595703125, 0.40679931640625, 0.42040252685546875, 0.4340057373046875, 0.44760894775390625, 0.461212158203125, 0.47481536865234375, 0.4884185791015625, 0.5020217895507812, 0.515625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 11.0, 53.0, 248.0, 441.0, 164.0, 52.0, 24.0, 8.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.920597076416016, -4.764099597930908, -4.607602596282959, -4.451105117797852, -4.294608116149902, -4.138110637664795, -3.9816133975982666, -3.8251161575317383, -3.66861891746521, -3.5121216773986816, -3.3556244373321533, -3.199127197265625, -3.0426297187805176, -2.8861327171325684, -2.729635238647461, -2.5731379985809326, -2.4166407585144043, -2.260143518447876, -2.1036462783813477, -1.9471489191055298, -1.7906516790390015, -1.6341544389724731, -1.4776570796966553, -1.321159839630127, -1.1646625995635986, -1.0081653594970703, -0.8516680598258972, -0.6951707601547241, -0.5386735200881958, -0.3821762800216675, -0.22567898035049438, -0.06918168067932129, 0.08731555938720703, 0.24381282925605774, 0.40031009912490845, 0.5568073987960815, 0.7133046388626099, 0.8698018789291382, 1.026299238204956, 1.1827964782714844, 1.3392937183380127, 1.495790958404541, 1.6522881984710693, 1.8087855577468872, 1.9652827978134155, 2.1217799186706543, 2.2782773971557617, 2.43477463722229, 2.5912718772888184, 2.7477691173553467, 2.904266357421875, 3.0607635974884033, 3.2172608375549316, 3.373758316040039, 3.5302555561065674, 3.6867527961730957, 3.843250036239624, 3.9997472763061523, 4.15624475479126, 4.312741756439209, 4.469239234924316, 4.625736236572266, 4.782233715057373, 4.9387311935424805, 5.09522819519043]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 15.0, 16.0, 22.0, 27.0, 49.0, 62.0, 70.0, 82.0, 85.0, 96.0, 81.0, 84.0, 78.0, 62.0, 47.0, 36.0, 40.0, 16.0, 14.0, 4.0, 7.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9566502571105957, -1.8838406801223755, -1.8110312223434448, -1.7382216453552246, -1.665412187576294, -1.5926026105880737, -1.5197930335998535, -1.4469835758209229, -1.3741739988327026, -1.3013644218444824, -1.2285549640655518, -1.1557453870773315, -1.0829358100891113, -1.0101263523101807, -0.9373167753219604, -0.864507257938385, -0.7916977405548096, -0.7188882231712341, -0.6460787057876587, -0.5732691287994385, -0.500459611415863, -0.4276500940322876, -0.35484054684638977, -0.28203099966049194, -0.2092214822769165, -0.13641194999217987, -0.06360241770744324, 0.009207114577293396, 0.08201664686203003, 0.15482616424560547, 0.2276357114315033, 0.3004452586174011, 0.37325501441955566, 0.4460645318031311, 0.5188740491867065, 0.5916836261749268, 0.6644931435585022, 0.7373026609420776, 0.8101122379302979, 0.8829217553138733, 0.9557312726974487, 1.028540849685669, 1.1013503074645996, 1.1741598844528198, 1.24696946144104, 1.3197789192199707, 1.392588496208191, 1.4653980731964111, 1.5382075309753418, 1.611017107963562, 1.6838265657424927, 1.756636142730713, 1.8294456005096436, 1.9022551774978638, 1.975064754486084, 2.0478742122650146, 2.1206836700439453, 2.193493127822876, 2.2663028240203857, 2.3391122817993164, 2.411921739578247, 2.4847311973571777, 2.5575408935546875, 2.630350351333618, 2.703160047531128]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 6.0, 5.0, 6.0, 5.0, 8.0, 9.0, 14.0, 20.0, 12.0, 22.0, 48.0, 50.0, 69.0, 102.0, 143.0, 369.0, 612.0, 1397.0, 3723.0, 14554.0, 80670.0, 683550.0, 222724.0, 29541.0, 6764.0, 2189.0, 865.0, 441.0, 237.0, 96.0, 94.0, 43.0, 51.0, 29.0, 25.0, 15.0, 10.0, 7.0, 8.0, 7.0, 3.0, 3.0, 0.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.6064453125, -1.5573577880859375, -1.508270263671875, -1.4591827392578125, -1.41009521484375, -1.3610076904296875, -1.311920166015625, -1.2628326416015625, -1.2137451171875, -1.1646575927734375, -1.115570068359375, -1.0664825439453125, -1.01739501953125, -0.9683074951171875, -0.919219970703125, -0.8701324462890625, -0.821044921875, -0.7719573974609375, -0.722869873046875, -0.6737823486328125, -0.62469482421875, -0.5756072998046875, -0.526519775390625, -0.4774322509765625, -0.4283447265625, -0.3792572021484375, -0.330169677734375, -0.2810821533203125, -0.23199462890625, -0.1829071044921875, -0.133819580078125, -0.0847320556640625, -0.03564453125, 0.0134429931640625, 0.062530517578125, 0.1116180419921875, 0.16070556640625, 0.2097930908203125, 0.258880615234375, 0.3079681396484375, 0.3570556640625, 0.4061431884765625, 0.455230712890625, 0.5043182373046875, 0.55340576171875, 0.6024932861328125, 0.651580810546875, 0.7006683349609375, 0.749755859375, 0.7988433837890625, 0.847930908203125, 0.8970184326171875, 0.94610595703125, 0.9951934814453125, 1.044281005859375, 1.0933685302734375, 1.1424560546875, 1.1915435791015625, 1.240631103515625, 1.2897186279296875, 1.33880615234375, 1.3878936767578125, 1.436981201171875, 1.4860687255859375, 1.53515625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 20.0, 20.0, 46.0, 80.0, 87.0, 129.0, 129.0, 133.0, 115.0, 95.0, 63.0, 31.0, 19.0, 13.0, 14.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.72998046875, -0.7140464782714844, -0.6981124877929688, -0.6821784973144531, -0.6662445068359375, -0.6503105163574219, -0.6343765258789062, -0.6184425354003906, -0.602508544921875, -0.5865745544433594, -0.5706405639648438, -0.5547065734863281, -0.5387725830078125, -0.5228385925292969, -0.5069046020507812, -0.4909706115722656, -0.47503662109375, -0.4591026306152344, -0.44316864013671875, -0.4272346496582031, -0.4113006591796875, -0.3953666687011719, -0.37943267822265625, -0.3634986877441406, -0.347564697265625, -0.3316307067871094, -0.31569671630859375, -0.2997627258300781, -0.2838287353515625, -0.2678947448730469, -0.25196075439453125, -0.23602676391601562, -0.2200927734375, -0.20415878295898438, -0.18822479248046875, -0.17229080200195312, -0.1563568115234375, -0.14042282104492188, -0.12448883056640625, -0.10855484008789062, -0.092620849609375, -0.07668685913085938, -0.06075286865234375, -0.044818878173828125, -0.0288848876953125, -0.012950897216796875, 0.00298309326171875, 0.018917083740234375, 0.03485107421875, 0.050785064697265625, 0.06671905517578125, 0.08265304565429688, 0.0985870361328125, 0.11452102661132812, 0.13045501708984375, 0.14638900756835938, 0.162322998046875, 0.17825698852539062, 0.19419097900390625, 0.21012496948242188, 0.2260589599609375, 0.24199295043945312, 0.25792694091796875, 0.2738609313964844, 0.289794921875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 6.0, 2.0, 5.0, 5.0, 14.0, 13.0, 21.0, 25.0, 39.0, 55.0, 81.0, 140.0, 228.0, 427.0, 776.0, 1597.0, 3513.0, 9316.0, 30409.0, 141664.0, 665351.0, 146531.0, 31341.0, 9604.0, 3676.0, 1705.0, 826.0, 463.0, 278.0, 166.0, 89.0, 58.0, 53.0, 23.0, 18.0, 11.0, 11.0, 4.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.220703125, -1.1819610595703125, -1.143218994140625, -1.1044769287109375, -1.06573486328125, -1.0269927978515625, -0.988250732421875, -0.9495086669921875, -0.9107666015625, -0.8720245361328125, -0.833282470703125, -0.7945404052734375, -0.75579833984375, -0.7170562744140625, -0.678314208984375, -0.6395721435546875, -0.600830078125, -0.5620880126953125, -0.523345947265625, -0.4846038818359375, -0.44586181640625, -0.4071197509765625, -0.368377685546875, -0.3296356201171875, -0.2908935546875, -0.2521514892578125, -0.213409423828125, -0.1746673583984375, -0.13592529296875, -0.0971832275390625, -0.058441162109375, -0.0196990966796875, 0.01904296875, 0.0577850341796875, 0.096527099609375, 0.1352691650390625, 0.17401123046875, 0.2127532958984375, 0.251495361328125, 0.2902374267578125, 0.3289794921875, 0.3677215576171875, 0.406463623046875, 0.4452056884765625, 0.48394775390625, 0.5226898193359375, 0.561431884765625, 0.6001739501953125, 0.638916015625, 0.6776580810546875, 0.716400146484375, 0.7551422119140625, 0.79388427734375, 0.8326263427734375, 0.871368408203125, 0.9101104736328125, 0.9488525390625, 0.9875946044921875, 1.026336669921875, 1.0650787353515625, 1.10382080078125, 1.1425628662109375, 1.181304931640625, 1.2200469970703125, 1.2587890625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 11.0, 7.0, 12.0, 16.0, 21.0, 30.0, 40.0, 39.0, 44.0, 59.0, 60.0, 57.0, 70.0, 71.0, 85.0, 71.0, 63.0, 47.0, 46.0, 29.0, 27.0, 25.0, 16.0, 7.0, 11.0, 9.0, 9.0, 4.0, 2.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4599609375, -1.4111785888671875, -1.362396240234375, -1.3136138916015625, -1.26483154296875, -1.2160491943359375, -1.167266845703125, -1.1184844970703125, -1.0697021484375, -1.0209197998046875, -0.972137451171875, -0.9233551025390625, -0.87457275390625, -0.8257904052734375, -0.777008056640625, -0.7282257080078125, -0.679443359375, -0.6306610107421875, -0.581878662109375, -0.5330963134765625, -0.48431396484375, -0.4355316162109375, -0.386749267578125, -0.3379669189453125, -0.2891845703125, -0.2404022216796875, -0.191619873046875, -0.1428375244140625, -0.09405517578125, -0.0452728271484375, 0.003509521484375, 0.0522918701171875, 0.10107421875, 0.1498565673828125, 0.198638916015625, 0.2474212646484375, 0.29620361328125, 0.3449859619140625, 0.393768310546875, 0.4425506591796875, 0.4913330078125, 0.5401153564453125, 0.588897705078125, 0.6376800537109375, 0.68646240234375, 0.7352447509765625, 0.784027099609375, 0.8328094482421875, 0.881591796875, 0.9303741455078125, 0.979156494140625, 1.0279388427734375, 1.07672119140625, 1.1255035400390625, 1.174285888671875, 1.2230682373046875, 1.2718505859375, 1.3206329345703125, 1.369415283203125, 1.4181976318359375, 1.46697998046875, 1.5157623291015625, 1.564544677734375, 1.6133270263671875, 1.662109375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 9.0, 11.0, 10.0, 17.0, 39.0, 62.0, 110.0, 177.0, 329.0, 598.0, 1177.0, 2503.0, 6954.0, 28276.0, 647902.0, 328059.0, 21957.0, 5847.0, 2275.0, 1039.0, 524.0, 285.0, 154.0, 100.0, 53.0, 24.0, 15.0, 18.0, 5.0, 2.0, 9.0, 1.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9443359375, -0.9147567749023438, -0.8851776123046875, -0.8555984497070312, -0.826019287109375, -0.7964401245117188, -0.7668609619140625, -0.7372817993164062, -0.70770263671875, -0.6781234741210938, -0.6485443115234375, -0.6189651489257812, -0.589385986328125, -0.5598068237304688, -0.5302276611328125, -0.5006484985351562, -0.4710693359375, -0.44149017333984375, -0.4119110107421875, -0.38233184814453125, -0.352752685546875, -0.32317352294921875, -0.2935943603515625, -0.26401519775390625, -0.23443603515625, -0.20485687255859375, -0.1752777099609375, -0.14569854736328125, -0.116119384765625, -0.08654022216796875, -0.0569610595703125, -0.02738189697265625, 0.002197265625, 0.03177642822265625, 0.0613555908203125, 0.09093475341796875, 0.120513916015625, 0.15009307861328125, 0.1796722412109375, 0.20925140380859375, 0.23883056640625, 0.26840972900390625, 0.2979888916015625, 0.32756805419921875, 0.357147216796875, 0.38672637939453125, 0.4163055419921875, 0.44588470458984375, 0.4754638671875, 0.5050430297851562, 0.5346221923828125, 0.5642013549804688, 0.593780517578125, 0.6233596801757812, 0.6529388427734375, 0.6825180053710938, 0.71209716796875, 0.7416763305664062, 0.7712554931640625, 0.8008346557617188, 0.830413818359375, 0.8599929809570312, 0.8895721435546875, 0.9191513061523438, 0.94873046875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 2.0, 3.0, 3.0, 3.0, 6.0, 9.0, 11.0, 11.0, 21.0, 28.0, 30.0, 65.0, 98.0, 138.0, 190.0, 136.0, 99.0, 41.0, 28.0, 22.0, 13.0, 14.0, 3.0, 1.0, 6.0, 4.0, 2.0, 7.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.052587509155273e-05, -7.837172597646713e-05, -7.621757686138153e-05, -7.406342774629593e-05, -7.190927863121033e-05, -6.975512951612473e-05, -6.760098040103912e-05, -6.544683128595352e-05, -6.329268217086792e-05, -6.113853305578232e-05, -5.8984383940696716e-05, -5.6830234825611115e-05, -5.467608571052551e-05, -5.252193659543991e-05, -5.036778748035431e-05, -4.821363836526871e-05, -4.6059489250183105e-05, -4.3905340135097504e-05, -4.17511910200119e-05, -3.95970419049263e-05, -3.74428927898407e-05, -3.5288743674755096e-05, -3.3134594559669495e-05, -3.098044544458389e-05, -2.882629632949829e-05, -2.667214721441269e-05, -2.4517998099327087e-05, -2.2363848984241486e-05, -2.0209699869155884e-05, -1.8055550754070282e-05, -1.590140163898468e-05, -1.3747252523899078e-05, -1.1593103408813477e-05, -9.438954293727875e-06, -7.284805178642273e-06, -5.130656063556671e-06, -2.9765069484710693e-06, -8.223578333854675e-07, 1.3317912817001343e-06, 3.485940396785736e-06, 5.640089511871338e-06, 7.79423862695694e-06, 9.948387742042542e-06, 1.2102536857128143e-05, 1.4256685972213745e-05, 1.6410835087299347e-05, 1.856498420238495e-05, 2.071913331747055e-05, 2.2873282432556152e-05, 2.5027431547641754e-05, 2.7181580662727356e-05, 2.9335729777812958e-05, 3.148987889289856e-05, 3.364402800798416e-05, 3.579817712306976e-05, 3.7952326238155365e-05, 4.010647535324097e-05, 4.226062446832657e-05, 4.441477358341217e-05, 4.656892269849777e-05, 4.8723071813583374e-05, 5.0877220928668976e-05, 5.303137004375458e-05, 5.518551915884018e-05, 5.733966827392578e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 5.0, 6.0, 4.0, 5.0, 13.0, 24.0, 43.0, 77.0, 193.0, 522.0, 1807.0, 9182.0, 739834.0, 287583.0, 7055.0, 1444.0, 440.0, 149.0, 73.0, 33.0, 22.0, 17.0, 9.0, 8.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7578125, -1.707489013671875, -1.65716552734375, -1.606842041015625, -1.5565185546875, -1.506195068359375, -1.45587158203125, -1.405548095703125, -1.355224609375, -1.304901123046875, -1.25457763671875, -1.204254150390625, -1.1539306640625, -1.103607177734375, -1.05328369140625, -1.002960205078125, -0.95263671875, -0.902313232421875, -0.85198974609375, -0.801666259765625, -0.7513427734375, -0.701019287109375, -0.65069580078125, -0.600372314453125, -0.550048828125, -0.499725341796875, -0.44940185546875, -0.399078369140625, -0.3487548828125, -0.298431396484375, -0.24810791015625, -0.197784423828125, -0.1474609375, -0.097137451171875, -0.04681396484375, 0.003509521484375, 0.0538330078125, 0.104156494140625, 0.15447998046875, 0.204803466796875, 0.255126953125, 0.305450439453125, 0.35577392578125, 0.406097412109375, 0.4564208984375, 0.506744384765625, 0.55706787109375, 0.607391357421875, 0.65771484375, 0.708038330078125, 0.75836181640625, 0.808685302734375, 0.8590087890625, 0.909332275390625, 0.95965576171875, 1.009979248046875, 1.060302734375, 1.110626220703125, 1.16094970703125, 1.211273193359375, 1.2615966796875, 1.311920166015625, 1.36224365234375, 1.412567138671875, 1.462890625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 7.0, 4.0, 12.0, 19.0, 28.0, 39.0, 64.0, 112.0, 155.0, 180.0, 134.0, 88.0, 45.0, 22.0, 21.0, 21.0, 9.0, 7.0, 8.0, 7.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.85693359375, -0.8319168090820312, -0.8069000244140625, -0.7818832397460938, -0.756866455078125, -0.7318496704101562, -0.7068328857421875, -0.6818161010742188, -0.65679931640625, -0.6317825317382812, -0.6067657470703125, -0.5817489624023438, -0.556732177734375, -0.5317153930664062, -0.5066986083984375, -0.48168182373046875, -0.4566650390625, -0.43164825439453125, -0.4066314697265625, -0.38161468505859375, -0.356597900390625, -0.33158111572265625, -0.3065643310546875, -0.28154754638671875, -0.25653076171875, -0.23151397705078125, -0.2064971923828125, -0.18148040771484375, -0.156463623046875, -0.13144683837890625, -0.1064300537109375, -0.08141326904296875, -0.056396484375, -0.03137969970703125, -0.0063629150390625, 0.01865386962890625, 0.043670654296875, 0.06868743896484375, 0.0937042236328125, 0.11872100830078125, 0.14373779296875, 0.16875457763671875, 0.1937713623046875, 0.21878814697265625, 0.243804931640625, 0.26882171630859375, 0.2938385009765625, 0.31885528564453125, 0.3438720703125, 0.36888885498046875, 0.3939056396484375, 0.41892242431640625, 0.443939208984375, 0.46895599365234375, 0.4939727783203125, 0.5189895629882812, 0.54400634765625, 0.5690231323242188, 0.5940399169921875, 0.6190567016601562, 0.644073486328125, 0.6690902709960938, 0.6941070556640625, 0.7191238403320312, 0.744140625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 8.0, 41.0, 99.0, 383.0, 328.0, 86.0, 35.0, 17.0, 7.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.99549865722656, -43.13209915161133, -42.268699645996094, -41.405303955078125, -40.54190444946289, -39.678504943847656, -38.81510543823242, -37.95170593261719, -37.08831024169922, -36.224910736083984, -35.36151123046875, -34.49811553955078, -33.63471603393555, -32.77131652832031, -31.907917022705078, -31.044519424438477, -30.181119918823242, -29.317720413208008, -28.454322814941406, -27.590923309326172, -26.72752571105957, -25.864126205444336, -25.000728607177734, -24.1373291015625, -23.273929595947266, -22.41053009033203, -21.54713249206543, -20.683732986450195, -19.820335388183594, -18.95693588256836, -18.093536376953125, -17.230138778686523, -16.366741180419922, -15.503342628479004, -14.639944076538086, -13.776544570922852, -12.91314697265625, -12.049747467041016, -11.186348915100098, -10.32295036315918, -9.459550857543945, -8.596152305603027, -7.732753753662109, -6.869354724884033, -6.005956172943115, -5.142557621002197, -4.279158592224121, -3.415760040283203, -2.552361488342285, -1.6889628171920776, -0.8255641460418701, 0.03783464431762695, 0.9012331962585449, 1.764631748199463, 2.628030776977539, 3.491429328918457, 4.354827880859375, 5.218226432800293, 6.081624984741211, 6.945024013519287, 7.808422565460205, 8.671821594238281, 9.5352201461792, 10.398618698120117, 11.262017250061035]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 7.0, 10.0, 8.0, 11.0, 18.0, 26.0, 13.0, 14.0, 30.0, 21.0, 30.0, 38.0, 34.0, 40.0, 34.0, 42.0, 45.0, 36.0, 48.0, 34.0, 31.0, 41.0, 37.0, 42.0, 39.0, 32.0, 31.0, 25.0, 26.0, 31.0, 23.0, 17.0, 17.0, 14.0, 10.0, 10.0, 10.0, 1.0, 7.0, 6.0, 6.0, 1.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.0648722648620605, -6.840939998626709, -6.617007255554199, -6.393074989318848, -6.169142723083496, -5.9452104568481445, -5.721277713775635, -5.497345447540283, -5.273412704467773, -5.049480438232422, -4.825547695159912, -4.6016154289245605, -4.377683162689209, -4.153750419616699, -3.9298181533813477, -3.705885887145996, -3.4819536209106445, -3.258021116256714, -3.0340888500213623, -2.8101563453674316, -2.58622407913208, -2.3622915744781494, -2.1383590698242188, -1.9144266843795776, -1.6904942989349365, -1.4665619134902954, -1.2426295280456543, -1.0186970233917236, -0.7947646379470825, -0.5708322525024414, -0.34689974784851074, -0.12296736240386963, 0.10096454620361328, 0.3248969614505768, 0.5488293766975403, 0.7727618217468262, 0.9966942071914673, 1.2206265926361084, 1.444559097290039, 1.6684914827346802, 1.8924238681793213, 2.116356372833252, 2.3402886390686035, 2.564221143722534, 2.788153648376465, 3.0120859146118164, 3.236018419265747, 3.4599509239196777, 3.6838831901550293, 3.90781569480896, 4.131748199462891, 4.355680465698242, 4.579612731933594, 4.803544998168945, 5.027477741241455, 5.251410007476807, 5.475342750549316, 5.699275016784668, 5.923207759857178, 6.147140026092529, 6.371072292327881, 6.595005035400391, 6.818937301635742, 7.042869567871094, 7.266801834106445]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 6.0, 13.0, 11.0, 20.0, 18.0, 24.0, 35.0, 51.0, 67.0, 139.0, 242.0, 502.0, 1150.0, 2639.0, 7669.0, 39533.0, 3961892.0, 156422.0, 16643.0, 4222.0, 1574.0, 714.0, 317.0, 178.0, 83.0, 48.0, 28.0, 12.0, 6.0, 6.0, 6.0, 3.0, 2.0, 1.0, 2.0], "bins": [-3.640625, -3.561065673828125, -3.48150634765625, -3.401947021484375, -3.3223876953125, -3.242828369140625, -3.16326904296875, -3.083709716796875, -3.004150390625, -2.924591064453125, -2.84503173828125, -2.765472412109375, -2.6859130859375, -2.606353759765625, -2.52679443359375, -2.447235107421875, -2.36767578125, -2.288116455078125, -2.20855712890625, -2.128997802734375, -2.0494384765625, -1.969879150390625, -1.89031982421875, -1.810760498046875, -1.731201171875, -1.651641845703125, -1.57208251953125, -1.492523193359375, -1.4129638671875, -1.333404541015625, -1.25384521484375, -1.174285888671875, -1.0947265625, -1.015167236328125, -0.93560791015625, -0.856048583984375, -0.7764892578125, -0.696929931640625, -0.61737060546875, -0.537811279296875, -0.458251953125, -0.378692626953125, -0.29913330078125, -0.219573974609375, -0.1400146484375, -0.060455322265625, 0.01910400390625, 0.098663330078125, 0.17822265625, 0.257781982421875, 0.33734130859375, 0.416900634765625, 0.4964599609375, 0.576019287109375, 0.65557861328125, 0.735137939453125, 0.814697265625, 0.894256591796875, 0.97381591796875, 1.053375244140625, 1.1329345703125, 1.212493896484375, 1.29205322265625, 1.371612548828125, 1.451171875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 5.0, 14.0, 23.0, 51.0, 64.0, 67.0, 70.0, 98.0, 88.0, 102.0, 108.0, 94.0, 61.0, 60.0, 27.0, 29.0, 17.0, 11.0, 7.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.7958984375, -0.7785758972167969, -0.7612533569335938, -0.7439308166503906, -0.7266082763671875, -0.7092857360839844, -0.6919631958007812, -0.6746406555175781, -0.657318115234375, -0.6399955749511719, -0.6226730346679688, -0.6053504943847656, -0.5880279541015625, -0.5707054138183594, -0.5533828735351562, -0.5360603332519531, -0.51873779296875, -0.5014152526855469, -0.48409271240234375, -0.4667701721191406, -0.4494476318359375, -0.4321250915527344, -0.41480255126953125, -0.3974800109863281, -0.380157470703125, -0.3628349304199219, -0.34551239013671875, -0.3281898498535156, -0.3108673095703125, -0.2935447692871094, -0.27622222900390625, -0.2588996887207031, -0.2415771484375, -0.22425460815429688, -0.20693206787109375, -0.18960952758789062, -0.1722869873046875, -0.15496444702148438, -0.13764190673828125, -0.12031936645507812, -0.102996826171875, -0.08567428588867188, -0.06835174560546875, -0.051029205322265625, -0.0337066650390625, -0.016384124755859375, 0.00093841552734375, 0.018260955810546875, 0.03558349609375, 0.052906036376953125, 0.07022857666015625, 0.08755111694335938, 0.1048736572265625, 0.12219619750976562, 0.13951873779296875, 0.15684127807617188, 0.174163818359375, 0.19148635864257812, 0.20880889892578125, 0.22613143920898438, 0.2434539794921875, 0.2607765197753906, 0.27809906005859375, 0.2954216003417969, 0.312744140625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 5.0, 10.0, 15.0, 19.0, 19.0, 31.0, 51.0, 80.0, 133.0, 167.0, 271.0, 407.0, 686.0, 1134.0, 2009.0, 3732.0, 7749.0, 18883.0, 67658.0, 2933291.0, 1060787.0, 62977.0, 18255.0, 7378.0, 3512.0, 1960.0, 1102.0, 700.0, 424.0, 275.0, 181.0, 125.0, 84.0, 50.0, 38.0, 26.0, 16.0, 10.0, 10.0, 8.0, 2.0, 4.0, 1.0, 4.0, 0.0, 2.0, 2.0], "bins": [-1.4951171875, -1.454681396484375, -1.41424560546875, -1.373809814453125, -1.3333740234375, -1.292938232421875, -1.25250244140625, -1.212066650390625, -1.171630859375, -1.131195068359375, -1.09075927734375, -1.050323486328125, -1.0098876953125, -0.969451904296875, -0.92901611328125, -0.888580322265625, -0.84814453125, -0.807708740234375, -0.76727294921875, -0.726837158203125, -0.6864013671875, -0.645965576171875, -0.60552978515625, -0.565093994140625, -0.524658203125, -0.484222412109375, -0.44378662109375, -0.403350830078125, -0.3629150390625, -0.322479248046875, -0.28204345703125, -0.241607666015625, -0.201171875, -0.160736083984375, -0.12030029296875, -0.079864501953125, -0.0394287109375, 0.001007080078125, 0.04144287109375, 0.081878662109375, 0.122314453125, 0.162750244140625, 0.20318603515625, 0.243621826171875, 0.2840576171875, 0.324493408203125, 0.36492919921875, 0.405364990234375, 0.44580078125, 0.486236572265625, 0.52667236328125, 0.567108154296875, 0.6075439453125, 0.647979736328125, 0.68841552734375, 0.728851318359375, 0.769287109375, 0.809722900390625, 0.85015869140625, 0.890594482421875, 0.9310302734375, 0.971466064453125, 1.01190185546875, 1.052337646484375, 1.0927734375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 7.0, 2.0, 2.0, 7.0, 9.0, 5.0, 15.0, 15.0, 31.0, 62.0, 83.0, 162.0, 2696.0, 532.0, 169.0, 87.0, 60.0, 27.0, 18.0, 24.0, 13.0, 13.0, 9.0, 6.0, 4.0, 2.0, 3.0, 3.0, 3.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65966796875, -0.6350479125976562, -0.6104278564453125, -0.5858078002929688, -0.561187744140625, -0.5365676879882812, -0.5119476318359375, -0.48732757568359375, -0.46270751953125, -0.43808746337890625, -0.4134674072265625, -0.38884735107421875, -0.364227294921875, -0.33960723876953125, -0.3149871826171875, -0.29036712646484375, -0.2657470703125, -0.24112701416015625, -0.2165069580078125, -0.19188690185546875, -0.167266845703125, -0.14264678955078125, -0.1180267333984375, -0.09340667724609375, -0.06878662109375, -0.04416656494140625, -0.0195465087890625, 0.00507354736328125, 0.029693603515625, 0.05431365966796875, 0.0789337158203125, 0.10355377197265625, 0.128173828125, 0.15279388427734375, 0.1774139404296875, 0.20203399658203125, 0.226654052734375, 0.25127410888671875, 0.2758941650390625, 0.30051422119140625, 0.32513427734375, 0.34975433349609375, 0.3743743896484375, 0.39899444580078125, 0.423614501953125, 0.44823455810546875, 0.4728546142578125, 0.49747467041015625, 0.5220947265625, 0.5467147827148438, 0.5713348388671875, 0.5959548950195312, 0.620574951171875, 0.6451950073242188, 0.6698150634765625, 0.6944351196289062, 0.71905517578125, 0.7436752319335938, 0.7682952880859375, 0.7929153442382812, 0.817535400390625, 0.8421554565429688, 0.8667755126953125, 0.8913955688476562, 0.916015625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 7.0, 9.0, 23.0, 38.0, 107.0, 216.0, 254.0, 151.0, 98.0, 44.0, 19.0, 19.0, 7.0, 8.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4229354858398438, -3.2424254417419434, -3.061915636062622, -2.8814055919647217, -2.7008957862854004, -2.5203857421875, -2.3398756980895996, -2.1593658924102783, -1.9788559675216675, -1.7983460426330566, -1.6178361177444458, -1.437326192855835, -1.2568161487579346, -1.0763063430786133, -0.8957962989807129, -0.715286374092102, -0.5347764492034912, -0.35426652431488037, -0.17375656962394714, 0.006753385066986084, 0.18726330995559692, 0.36777323484420776, 0.5482832193374634, 0.7287931442260742, 0.9093030691146851, 1.089812994003296, 1.2703229188919067, 1.4508328437805176, 1.631342887878418, 1.8118526935577393, 1.9923627376556396, 2.172872543334961, 2.3533825874328613, 2.5338926315307617, 2.714402437210083, 2.8949124813079834, 3.0754222869873047, 3.255932331085205, 3.4364423751831055, 3.6169521808624268, 3.797461986541748, 3.9779720306396484, 4.158482074737549, 4.338991641998291, 4.519501686096191, 4.700011730194092, 4.880521774291992, 5.061031341552734, 5.241541862487793, 5.422051906585693, 5.602561950683594, 5.783071517944336, 5.963581562042236, 6.144091606140137, 6.324601650238037, 6.5051116943359375, 6.68562126159668, 6.86613130569458, 7.0466413497924805, 7.227150917053223, 7.407660961151123, 7.588171005249023, 7.768681049346924, 7.949191093444824, 8.129700660705566]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 1.0, 5.0, 9.0, 8.0, 13.0, 21.0, 32.0, 25.0, 34.0, 35.0, 33.0, 51.0, 50.0, 62.0, 61.0, 70.0, 47.0, 56.0, 50.0, 60.0, 36.0, 48.0, 37.0, 33.0, 29.0, 30.0, 19.0, 13.0, 11.0, 8.0, 7.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.947227954864502, -2.8547418117523193, -2.7622554302215576, -2.669769287109375, -2.5772831439971924, -2.4847970008850098, -2.392310619354248, -2.2998244762420654, -2.207338333129883, -2.1148521900177, -2.0223658084869385, -1.9298796653747559, -1.8373935222625732, -1.744907259941101, -1.652420997619629, -1.5599348545074463, -1.4674485921859741, -1.374962329864502, -1.2824761867523193, -1.1899899244308472, -1.0975037813186646, -1.0050175189971924, -0.912531316280365, -0.8200451135635376, -0.7275589108467102, -0.6350727081298828, -0.5425865054130554, -0.45010027289390564, -0.35761407017707825, -0.26512786746025085, -0.17264163494110107, -0.08015543222427368, 0.012330770492553711, 0.1048169806599617, 0.1973031908273697, 0.2897894084453583, 0.38227561116218567, 0.47476181387901306, 0.5672480463981628, 0.6597342491149902, 0.7522204518318176, 0.844706654548645, 0.9371928572654724, 1.0296790599822998, 1.122165322303772, 1.2146514654159546, 1.3071377277374268, 1.3996238708496094, 1.4921101331710815, 1.5845963954925537, 1.6770825386047363, 1.7695688009262085, 1.8620549440383911, 1.9545412063598633, 2.047027349472046, 2.1395134925842285, 2.2319998741149902, 2.324486017227173, 2.4169723987579346, 2.509458541870117, 2.6019446849823, 2.6944308280944824, 2.786917209625244, 2.8794033527374268, 2.9718894958496094]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 6.0, 4.0, 9.0, 9.0, 16.0, 11.0, 26.0, 42.0, 44.0, 62.0, 94.0, 171.0, 429.0, 902.0, 2186.0, 6167.0, 23313.0, 103050.0, 620274.0, 232183.0, 42574.0, 11164.0, 3366.0, 1298.0, 566.0, 239.0, 117.0, 74.0, 49.0, 39.0, 23.0, 15.0, 12.0, 8.0, 6.0, 8.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.208984375, -2.145355224609375, -2.08172607421875, -2.018096923828125, -1.9544677734375, -1.890838623046875, -1.82720947265625, -1.763580322265625, -1.699951171875, -1.636322021484375, -1.57269287109375, -1.509063720703125, -1.4454345703125, -1.381805419921875, -1.31817626953125, -1.254547119140625, -1.19091796875, -1.127288818359375, -1.06365966796875, -1.000030517578125, -0.9364013671875, -0.872772216796875, -0.80914306640625, -0.745513916015625, -0.681884765625, -0.618255615234375, -0.55462646484375, -0.490997314453125, -0.4273681640625, -0.363739013671875, -0.30010986328125, -0.236480712890625, -0.1728515625, -0.109222412109375, -0.04559326171875, 0.018035888671875, 0.0816650390625, 0.145294189453125, 0.20892333984375, 0.272552490234375, 0.336181640625, 0.399810791015625, 0.46343994140625, 0.527069091796875, 0.5906982421875, 0.654327392578125, 0.71795654296875, 0.781585693359375, 0.84521484375, 0.908843994140625, 0.97247314453125, 1.036102294921875, 1.0997314453125, 1.163360595703125, 1.22698974609375, 1.290618896484375, 1.354248046875, 1.417877197265625, 1.48150634765625, 1.545135498046875, 1.6087646484375, 1.672393798828125, 1.73602294921875, 1.799652099609375, 1.86328125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 1.0, 2.0, 10.0, 12.0, 31.0, 46.0, 57.0, 65.0, 73.0, 66.0, 95.0, 100.0, 98.0, 90.0, 69.0, 57.0, 32.0, 29.0, 28.0, 14.0, 11.0, 8.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.748046875, -0.73114013671875, -0.7142333984375, -0.69732666015625, -0.680419921875, -0.66351318359375, -0.6466064453125, -0.62969970703125, -0.61279296875, -0.59588623046875, -0.5789794921875, -0.56207275390625, -0.545166015625, -0.52825927734375, -0.5113525390625, -0.49444580078125, -0.4775390625, -0.46063232421875, -0.4437255859375, -0.42681884765625, -0.409912109375, -0.39300537109375, -0.3760986328125, -0.35919189453125, -0.34228515625, -0.32537841796875, -0.3084716796875, -0.29156494140625, -0.274658203125, -0.25775146484375, -0.2408447265625, -0.22393798828125, -0.20703125, -0.19012451171875, -0.1732177734375, -0.15631103515625, -0.139404296875, -0.12249755859375, -0.1055908203125, -0.08868408203125, -0.07177734375, -0.05487060546875, -0.0379638671875, -0.02105712890625, -0.004150390625, 0.01275634765625, 0.0296630859375, 0.04656982421875, 0.0634765625, 0.08038330078125, 0.0972900390625, 0.11419677734375, 0.131103515625, 0.14801025390625, 0.1649169921875, 0.18182373046875, 0.19873046875, 0.21563720703125, 0.2325439453125, 0.24945068359375, 0.266357421875, 0.28326416015625, 0.3001708984375, 0.31707763671875, 0.333984375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 4.0, 1.0, 6.0, 4.0, 14.0, 8.0, 21.0, 27.0, 38.0, 60.0, 79.0, 99.0, 195.0, 286.0, 451.0, 783.0, 1396.0, 2670.0, 5758.0, 13439.0, 36128.0, 117413.0, 521079.0, 248490.0, 61800.0, 21377.0, 8691.0, 3762.0, 1878.0, 996.0, 559.0, 367.0, 222.0, 165.0, 93.0, 72.0, 42.0, 29.0, 16.0, 11.0, 10.0, 5.0, 5.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5654296875, -1.5145111083984375, -1.463592529296875, -1.4126739501953125, -1.36175537109375, -1.3108367919921875, -1.259918212890625, -1.2089996337890625, -1.1580810546875, -1.1071624755859375, -1.056243896484375, -1.0053253173828125, -0.95440673828125, -0.9034881591796875, -0.852569580078125, -0.8016510009765625, -0.750732421875, -0.6998138427734375, -0.648895263671875, -0.5979766845703125, -0.54705810546875, -0.4961395263671875, -0.445220947265625, -0.3943023681640625, -0.3433837890625, -0.2924652099609375, -0.241546630859375, -0.1906280517578125, -0.13970947265625, -0.0887908935546875, -0.037872314453125, 0.0130462646484375, 0.06396484375, 0.1148834228515625, 0.165802001953125, 0.2167205810546875, 0.26763916015625, 0.3185577392578125, 0.369476318359375, 0.4203948974609375, 0.4713134765625, 0.5222320556640625, 0.573150634765625, 0.6240692138671875, 0.67498779296875, 0.7259063720703125, 0.776824951171875, 0.8277435302734375, 0.878662109375, 0.9295806884765625, 0.980499267578125, 1.0314178466796875, 1.08233642578125, 1.1332550048828125, 1.184173583984375, 1.2350921630859375, 1.2860107421875, 1.3369293212890625, 1.387847900390625, 1.4387664794921875, 1.48968505859375, 1.5406036376953125, 1.591522216796875, 1.6424407958984375, 1.693359375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 10.0, 9.0, 18.0, 16.0, 17.0, 26.0, 27.0, 35.0, 39.0, 38.0, 41.0, 49.0, 54.0, 54.0, 54.0, 48.0, 52.0, 59.0, 46.0, 41.0, 46.0, 45.0, 36.0, 28.0, 26.0, 17.0, 13.0, 12.0, 10.0, 10.0, 1.0, 8.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.357421875, -2.288116455078125, -2.21881103515625, -2.149505615234375, -2.0802001953125, -2.010894775390625, -1.94158935546875, -1.872283935546875, -1.802978515625, -1.733673095703125, -1.66436767578125, -1.595062255859375, -1.5257568359375, -1.456451416015625, -1.38714599609375, -1.317840576171875, -1.24853515625, -1.179229736328125, -1.10992431640625, -1.040618896484375, -0.9713134765625, -0.902008056640625, -0.83270263671875, -0.763397216796875, -0.694091796875, -0.624786376953125, -0.55548095703125, -0.486175537109375, -0.4168701171875, -0.347564697265625, -0.27825927734375, -0.208953857421875, -0.1396484375, -0.070343017578125, -0.00103759765625, 0.068267822265625, 0.1375732421875, 0.206878662109375, 0.27618408203125, 0.345489501953125, 0.414794921875, 0.484100341796875, 0.55340576171875, 0.622711181640625, 0.6920166015625, 0.761322021484375, 0.83062744140625, 0.899932861328125, 0.96923828125, 1.038543701171875, 1.10784912109375, 1.177154541015625, 1.2464599609375, 1.315765380859375, 1.38507080078125, 1.454376220703125, 1.523681640625, 1.592987060546875, 1.66229248046875, 1.731597900390625, 1.8009033203125, 1.870208740234375, 1.93951416015625, 2.008819580078125, 2.078125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 7.0, 7.0, 8.0, 12.0, 18.0, 20.0, 43.0, 65.0, 96.0, 134.0, 256.0, 429.0, 812.0, 1680.0, 4412.0, 18028.0, 412152.0, 580704.0, 21186.0, 4701.0, 1813.0, 795.0, 457.0, 294.0, 161.0, 92.0, 58.0, 41.0, 27.0, 17.0, 16.0, 6.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4599609375, -1.4096832275390625, -1.359405517578125, -1.3091278076171875, -1.25885009765625, -1.2085723876953125, -1.158294677734375, -1.1080169677734375, -1.0577392578125, -1.0074615478515625, -0.957183837890625, -0.9069061279296875, -0.85662841796875, -0.8063507080078125, -0.756072998046875, -0.7057952880859375, -0.655517578125, -0.6052398681640625, -0.554962158203125, -0.5046844482421875, -0.45440673828125, -0.4041290283203125, -0.353851318359375, -0.3035736083984375, -0.2532958984375, -0.2030181884765625, -0.152740478515625, -0.1024627685546875, -0.05218505859375, -0.0019073486328125, 0.048370361328125, 0.0986480712890625, 0.14892578125, 0.1992034912109375, 0.249481201171875, 0.2997589111328125, 0.35003662109375, 0.4003143310546875, 0.450592041015625, 0.5008697509765625, 0.5511474609375, 0.6014251708984375, 0.651702880859375, 0.7019805908203125, 0.75225830078125, 0.8025360107421875, 0.852813720703125, 0.9030914306640625, 0.953369140625, 1.0036468505859375, 1.053924560546875, 1.1042022705078125, 1.15447998046875, 1.2047576904296875, 1.255035400390625, 1.3053131103515625, 1.3555908203125, 1.4058685302734375, 1.456146240234375, 1.5064239501953125, 1.55670166015625, 1.6069793701171875, 1.657257080078125, 1.7075347900390625, 1.7578125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 8.0, 9.0, 17.0, 21.0, 50.0, 102.0, 162.0, 204.0, 171.0, 116.0, 54.0, 33.0, 14.0, 11.0, 8.0, 6.0, 5.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015807151794433594, -0.00015350431203842163, -0.00014893710613250732, -0.00014436990022659302, -0.0001398026943206787, -0.0001352354884147644, -0.0001306682825088501, -0.0001261010766029358, -0.00012153387069702148, -0.00011696666479110718, -0.00011239945888519287, -0.00010783225297927856, -0.00010326504707336426, -9.869784116744995e-05, -9.413063526153564e-05, -8.956342935562134e-05, -8.499622344970703e-05, -8.042901754379272e-05, -7.586181163787842e-05, -7.129460573196411e-05, -6.67273998260498e-05, -6.21601939201355e-05, -5.759298801422119e-05, -5.3025782108306885e-05, -4.845857620239258e-05, -4.389137029647827e-05, -3.9324164390563965e-05, -3.475695848464966e-05, -3.018975257873535e-05, -2.5622546672821045e-05, -2.1055340766906738e-05, -1.648813486099243e-05, -1.1920928955078125e-05, -7.353723049163818e-06, -2.7865171432495117e-06, 1.780688762664795e-06, 6.3478946685791016e-06, 1.0915100574493408e-05, 1.5482306480407715e-05, 2.004951238632202e-05, 2.4616718292236328e-05, 2.9183924198150635e-05, 3.375113010406494e-05, 3.831833600997925e-05, 4.2885541915893555e-05, 4.745274782180786e-05, 5.201995372772217e-05, 5.6587159633636475e-05, 6.115436553955078e-05, 6.572157144546509e-05, 7.02887773513794e-05, 7.48559832572937e-05, 7.942318916320801e-05, 8.399039506912231e-05, 8.855760097503662e-05, 9.312480688095093e-05, 9.769201278686523e-05, 0.00010225921869277954, 0.00010682642459869385, 0.00011139363050460815, 0.00011596083641052246, 0.00012052804231643677, 0.00012509524822235107, 0.00012966245412826538, 0.0001342296600341797]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 2.0, 5.0, 6.0, 10.0, 14.0, 23.0, 34.0, 61.0, 85.0, 130.0, 218.0, 368.0, 700.0, 1477.0, 3616.0, 11393.0, 83809.0, 848821.0, 80007.0, 11170.0, 3465.0, 1467.0, 692.0, 371.0, 213.0, 136.0, 89.0, 58.0, 25.0, 32.0, 14.0, 13.0, 12.0, 5.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.3203125, -1.283111572265625, -1.24591064453125, -1.208709716796875, -1.1715087890625, -1.134307861328125, -1.09710693359375, -1.059906005859375, -1.022705078125, -0.985504150390625, -0.94830322265625, -0.911102294921875, -0.8739013671875, -0.836700439453125, -0.79949951171875, -0.762298583984375, -0.72509765625, -0.687896728515625, -0.65069580078125, -0.613494873046875, -0.5762939453125, -0.539093017578125, -0.50189208984375, -0.464691162109375, -0.427490234375, -0.390289306640625, -0.35308837890625, -0.315887451171875, -0.2786865234375, -0.241485595703125, -0.20428466796875, -0.167083740234375, -0.1298828125, -0.092681884765625, -0.05548095703125, -0.018280029296875, 0.0189208984375, 0.056121826171875, 0.09332275390625, 0.130523681640625, 0.167724609375, 0.204925537109375, 0.24212646484375, 0.279327392578125, 0.3165283203125, 0.353729248046875, 0.39093017578125, 0.428131103515625, 0.46533203125, 0.502532958984375, 0.53973388671875, 0.576934814453125, 0.6141357421875, 0.651336669921875, 0.68853759765625, 0.725738525390625, 0.762939453125, 0.800140380859375, 0.83734130859375, 0.874542236328125, 0.9117431640625, 0.948944091796875, 0.98614501953125, 1.023345947265625, 1.060546875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 1.0, 3.0, 4.0, 10.0, 17.0, 26.0, 43.0, 66.0, 107.0, 219.0, 205.0, 119.0, 72.0, 35.0, 24.0, 12.0, 9.0, 4.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.296875, -1.25042724609375, -1.2039794921875, -1.15753173828125, -1.111083984375, -1.06463623046875, -1.0181884765625, -0.97174072265625, -0.92529296875, -0.87884521484375, -0.8323974609375, -0.78594970703125, -0.739501953125, -0.69305419921875, -0.6466064453125, -0.60015869140625, -0.5537109375, -0.50726318359375, -0.4608154296875, -0.41436767578125, -0.367919921875, -0.32147216796875, -0.2750244140625, -0.22857666015625, -0.18212890625, -0.13568115234375, -0.0892333984375, -0.04278564453125, 0.003662109375, 0.05010986328125, 0.0965576171875, 0.14300537109375, 0.189453125, 0.23590087890625, 0.2823486328125, 0.32879638671875, 0.375244140625, 0.42169189453125, 0.4681396484375, 0.51458740234375, 0.56103515625, 0.60748291015625, 0.6539306640625, 0.70037841796875, 0.746826171875, 0.79327392578125, 0.8397216796875, 0.88616943359375, 0.9326171875, 0.97906494140625, 1.0255126953125, 1.07196044921875, 1.118408203125, 1.16485595703125, 1.2113037109375, 1.25775146484375, 1.30419921875, 1.35064697265625, 1.3970947265625, 1.44354248046875, 1.489990234375, 1.53643798828125, 1.5828857421875, 1.62933349609375, 1.67578125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 1.0, 3.0, 11.0, 16.0, 26.0, 52.0, 124.0, 225.0, 295.0, 138.0, 51.0, 33.0, 21.0, 5.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-42.71803283691406, -41.811527252197266, -40.90502166748047, -39.99851608276367, -39.092010498046875, -38.18550491333008, -37.27899932861328, -36.372493743896484, -35.46598815917969, -34.55948257446289, -33.652976989746094, -32.7464714050293, -31.8399658203125, -30.933460235595703, -30.026954650878906, -29.12044906616211, -28.213943481445312, -27.307437896728516, -26.40093231201172, -25.494426727294922, -24.587921142578125, -23.681415557861328, -22.77490997314453, -21.868404388427734, -20.96190071105957, -20.055395126342773, -19.148889541625977, -18.24238395690918, -17.335878372192383, -16.429372787475586, -15.522867202758789, -14.616361618041992, -13.709855079650879, -12.803349494934082, -11.896843910217285, -10.990338325500488, -10.083832740783691, -9.177328109741211, -8.270822525024414, -7.364316463470459, -6.457810878753662, -5.551305294036865, -4.644799709320068, -3.7382943630218506, -2.8317887783050537, -1.925283432006836, -1.018777847290039, -0.11227226257324219, 0.7942333221435547, 1.7007389068603516, 2.6072444915771484, 3.513749837875366, 4.420255661010742, 5.326760768890381, 6.233266353607178, 7.139771938323975, 8.04627799987793, 8.952783584594727, 9.859289169311523, 10.76579475402832, 11.672300338745117, 12.578805923461914, 13.485311508178711, 14.391817092895508, 15.298321723937988]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 0.0, 0.0, 3.0, 3.0, 12.0, 12.0, 7.0, 10.0, 12.0, 21.0, 13.0, 26.0, 21.0, 29.0, 28.0, 26.0, 30.0, 59.0, 48.0, 47.0, 48.0, 51.0, 59.0, 52.0, 55.0, 45.0, 37.0, 31.0, 38.0, 38.0, 20.0, 26.0, 15.0, 17.0, 17.0, 6.0, 12.0, 4.0, 3.0, 8.0, 3.0, 7.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.458839416503906, -14.010566711425781, -13.562294006347656, -13.114022254943848, -12.665749549865723, -12.217476844787598, -11.769204139709473, -11.320932388305664, -10.872659683227539, -10.424386978149414, -9.976114273071289, -9.52784252166748, -9.079569816589355, -8.63129711151123, -8.183024406433105, -7.734752178192139, -7.286479473114014, -6.838206768035889, -6.389934539794922, -5.941661834716797, -5.49338960647583, -5.045116901397705, -4.596844673156738, -4.148571968078613, -3.7002995014190674, -3.2520270347595215, -2.8037545680999756, -2.3554821014404297, -1.9072095155715942, -1.4589369297027588, -1.010664463043213, -0.562391996383667, -0.1141195297241211, 0.3341529667377472, 0.7824254631996155, 1.2306979894638062, 1.678970456123352, 2.1272430419921875, 2.5755155086517334, 3.0237879753112793, 3.472060441970825, 3.920332908630371, 4.368605613708496, 4.816877841949463, 5.265150547027588, 5.713422775268555, 6.16169548034668, 6.609968185424805, 7.0582404136657715, 7.5065131187438965, 7.954785346984863, 8.403058052062988, 8.851330757141113, 9.299602508544922, 9.747875213623047, 10.196147918701172, 10.644420623779297, 11.092693328857422, 11.540966033935547, 11.989237785339355, 12.43751049041748, 12.885783195495605, 13.33405590057373, 13.782327651977539, 14.230600357055664]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 5.0, 1.0, 3.0, 3.0, 14.0, 14.0, 21.0, 26.0, 28.0, 69.0, 93.0, 148.0, 251.0, 389.0, 635.0, 1131.0, 2186.0, 4513.0, 20267.0, 4144184.0, 12124.0, 3813.0, 1863.0, 1048.0, 554.0, 328.0, 213.0, 131.0, 73.0, 63.0, 33.0, 20.0, 16.0, 6.0, 12.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.703125, -4.5894775390625, -4.475830078125, -4.3621826171875, -4.24853515625, -4.1348876953125, -4.021240234375, -3.9075927734375, -3.7939453125, -3.6802978515625, -3.566650390625, -3.4530029296875, -3.33935546875, -3.2257080078125, -3.112060546875, -2.9984130859375, -2.884765625, -2.7711181640625, -2.657470703125, -2.5438232421875, -2.43017578125, -2.3165283203125, -2.202880859375, -2.0892333984375, -1.9755859375, -1.8619384765625, -1.748291015625, -1.6346435546875, -1.52099609375, -1.4073486328125, -1.293701171875, -1.1800537109375, -1.06640625, -0.9527587890625, -0.839111328125, -0.7254638671875, -0.61181640625, -0.4981689453125, -0.384521484375, -0.2708740234375, -0.1572265625, -0.0435791015625, 0.070068359375, 0.1837158203125, 0.29736328125, 0.4110107421875, 0.524658203125, 0.6383056640625, 0.751953125, 0.8656005859375, 0.979248046875, 1.0928955078125, 1.20654296875, 1.3201904296875, 1.433837890625, 1.5474853515625, 1.6611328125, 1.7747802734375, 1.888427734375, 2.0020751953125, 2.11572265625, 2.2293701171875, 2.343017578125, 2.4566650390625, 2.5703125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 6.0, 2.0, 4.0, 8.0, 14.0, 15.0, 16.0, 22.0, 30.0, 45.0, 42.0, 62.0, 68.0, 60.0, 58.0, 72.0, 79.0, 81.0, 74.0, 57.0, 46.0, 37.0, 25.0, 24.0, 14.0, 4.0, 15.0, 10.0, 11.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.8076171875, -0.7876091003417969, -0.7676010131835938, -0.7475929260253906, -0.7275848388671875, -0.7075767517089844, -0.6875686645507812, -0.6675605773925781, -0.647552490234375, -0.6275444030761719, -0.6075363159179688, -0.5875282287597656, -0.5675201416015625, -0.5475120544433594, -0.5275039672851562, -0.5074958801269531, -0.48748779296875, -0.4674797058105469, -0.44747161865234375, -0.4274635314941406, -0.4074554443359375, -0.3874473571777344, -0.36743927001953125, -0.3474311828613281, -0.327423095703125, -0.3074150085449219, -0.28740692138671875, -0.2673988342285156, -0.2473907470703125, -0.22738265991210938, -0.20737457275390625, -0.18736648559570312, -0.1673583984375, -0.14735031127929688, -0.12734222412109375, -0.10733413696289062, -0.0873260498046875, -0.06731796264648438, -0.04730987548828125, -0.027301788330078125, -0.007293701171875, 0.012714385986328125, 0.03272247314453125, 0.052730560302734375, 0.0727386474609375, 0.09274673461914062, 0.11275482177734375, 0.13276290893554688, 0.15277099609375, 0.17277908325195312, 0.19278717041015625, 0.21279525756835938, 0.2328033447265625, 0.2528114318847656, 0.27281951904296875, 0.2928276062011719, 0.312835693359375, 0.3328437805175781, 0.35285186767578125, 0.3728599548339844, 0.3928680419921875, 0.4128761291503906, 0.43288421630859375, 0.4528923034667969, 0.472900390625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 7.0, 6.0, 11.0, 9.0, 18.0, 13.0, 27.0, 24.0, 41.0, 62.0, 84.0, 91.0, 145.0, 201.0, 282.0, 391.0, 609.0, 897.0, 1374.0, 2649.0, 5987.0, 19134.0, 4101665.0, 43373.0, 8800.0, 3402.0, 1735.0, 1022.0, 661.0, 446.0, 327.0, 199.0, 149.0, 125.0, 77.0, 65.0, 54.0, 35.0, 22.0, 21.0, 11.0, 14.0, 7.0, 4.0, 3.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.021484375, -2.926116943359375, -2.83074951171875, -2.735382080078125, -2.6400146484375, -2.544647216796875, -2.44927978515625, -2.353912353515625, -2.258544921875, -2.163177490234375, -2.06781005859375, -1.972442626953125, -1.8770751953125, -1.781707763671875, -1.68634033203125, -1.590972900390625, -1.49560546875, -1.400238037109375, -1.30487060546875, -1.209503173828125, -1.1141357421875, -1.018768310546875, -0.92340087890625, -0.828033447265625, -0.732666015625, -0.637298583984375, -0.54193115234375, -0.446563720703125, -0.3511962890625, -0.255828857421875, -0.16046142578125, -0.065093994140625, 0.0302734375, 0.125640869140625, 0.22100830078125, 0.316375732421875, 0.4117431640625, 0.507110595703125, 0.60247802734375, 0.697845458984375, 0.793212890625, 0.888580322265625, 0.98394775390625, 1.079315185546875, 1.1746826171875, 1.270050048828125, 1.36541748046875, 1.460784912109375, 1.55615234375, 1.651519775390625, 1.74688720703125, 1.842254638671875, 1.9376220703125, 2.032989501953125, 2.12835693359375, 2.223724365234375, 2.319091796875, 2.414459228515625, 2.50982666015625, 2.605194091796875, 2.7005615234375, 2.795928955078125, 2.89129638671875, 2.986663818359375, 3.08203125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 8.0, 5.0, 9.0, 26.0, 100.0, 3799.0, 58.0, 20.0, 16.0, 5.0, 3.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6826171875, -0.6615142822265625, -0.640411376953125, -0.6193084716796875, -0.59820556640625, -0.5771026611328125, -0.555999755859375, -0.5348968505859375, -0.5137939453125, -0.4926910400390625, -0.471588134765625, -0.4504852294921875, -0.42938232421875, -0.4082794189453125, -0.387176513671875, -0.3660736083984375, -0.344970703125, -0.3238677978515625, -0.302764892578125, -0.2816619873046875, -0.26055908203125, -0.2394561767578125, -0.218353271484375, -0.1972503662109375, -0.1761474609375, -0.1550445556640625, -0.133941650390625, -0.1128387451171875, -0.09173583984375, -0.0706329345703125, -0.049530029296875, -0.0284271240234375, -0.00732421875, 0.0137786865234375, 0.034881591796875, 0.0559844970703125, 0.07708740234375, 0.0981903076171875, 0.119293212890625, 0.1403961181640625, 0.1614990234375, 0.1826019287109375, 0.203704833984375, 0.2248077392578125, 0.24591064453125, 0.2670135498046875, 0.288116455078125, 0.3092193603515625, 0.330322265625, 0.3514251708984375, 0.372528076171875, 0.3936309814453125, 0.41473388671875, 0.4358367919921875, 0.456939697265625, 0.4780426025390625, 0.4991455078125, 0.5202484130859375, 0.541351318359375, 0.5624542236328125, 0.58355712890625, 0.6046600341796875, 0.625762939453125, 0.6468658447265625, 0.66796875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 11.0, 9.0, 34.0, 69.0, 108.0, 244.0, 277.0, 154.0, 55.0, 29.0, 15.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.771570205688477, -5.6543707847595215, -5.537170886993408, -5.419971466064453, -5.30277156829834, -5.185572147369385, -5.0683722496032715, -4.951172828674316, -4.833972930908203, -4.716773509979248, -4.599573612213135, -4.48237419128418, -4.365174293518066, -4.247974872589111, -4.130774974822998, -4.013575553894043, -3.896376132965088, -3.7791764736175537, -3.6619768142700195, -3.5447771549224854, -3.427577495574951, -3.310378074645996, -3.193178415298462, -3.0759787559509277, -2.9587790966033936, -2.8415794372558594, -2.724379777908325, -2.607180118560791, -2.489980697631836, -2.3727807998657227, -2.2555813789367676, -2.1383817195892334, -2.0211822986602783, -1.9039826393127441, -1.78678297996521, -1.6695834398269653, -1.5523837804794312, -1.435184121131897, -1.3179845809936523, -1.2007849216461182, -1.083585262298584, -0.9663856029510498, -0.8491860032081604, -0.731986403465271, -0.6147867441177368, -0.49758708477020264, -0.38038748502731323, -0.26318788528442383, -0.14598822593688965, -0.028788596391677856, 0.08841103315353394, 0.20561066269874573, 0.3228102922439575, 0.4400099515914917, 0.5572095513343811, 0.6744091510772705, 0.7916088104248047, 0.9088084697723389, 1.026008129119873, 1.1432076692581177, 1.2604073286056519, 1.377606987953186, 1.4948065280914307, 1.6120061874389648, 1.729205846786499]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 4.0, 3.0, 3.0, 6.0, 4.0, 13.0, 13.0, 9.0, 17.0, 23.0, 26.0, 33.0, 30.0, 39.0, 33.0, 47.0, 43.0, 43.0, 46.0, 51.0, 36.0, 44.0, 52.0, 43.0, 37.0, 47.0, 29.0, 32.0, 32.0, 36.0, 24.0, 20.0, 19.0, 18.0, 9.0, 12.0, 10.0, 10.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0555193424224854, -1.0179657936096191, -0.9804121255874634, -0.9428585767745972, -0.9053049683570862, -0.8677513599395752, -0.8301977515220642, -0.7926441431045532, -0.755090594291687, -0.717536985874176, -0.679983377456665, -0.6424298286437988, -0.6048762202262878, -0.5673226118087769, -0.5297690033912659, -0.49221542477607727, -0.4546617865562439, -0.4171081781387329, -0.3795545995235443, -0.3420009911060333, -0.3044474124908447, -0.26689380407333374, -0.22934019565582275, -0.19178661704063416, -0.15423300862312317, -0.11667941510677338, -0.07912581413984299, -0.0415722131729126, -0.004018619656562805, 0.03353497385978699, 0.07108858227729797, 0.10864216089248657, 0.14619576930999756, 0.18374936282634735, 0.22130295634269714, 0.25885656476020813, 0.29641014337539673, 0.3339637517929077, 0.3715173602104187, 0.4090709388256073, 0.4466245472431183, 0.4841781556606293, 0.5217317342758179, 0.5592853426933289, 0.5968389511108398, 0.634392499923706, 0.6719461679458618, 0.709499716758728, 0.747053325176239, 0.78460693359375, 0.822160542011261, 0.859714150428772, 0.8972676992416382, 0.9348213076591492, 0.9723749160766602, 1.0099284648895264, 1.0474821329116821, 1.0850356817245483, 1.122589349746704, 1.1601428985595703, 1.197696566581726, 1.2352501153945923, 1.272803783416748, 1.3103573322296143, 1.3479108810424805]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 9.0, 1.0, 4.0, 8.0, 7.0, 18.0, 13.0, 28.0, 48.0, 61.0, 94.0, 140.0, 225.0, 352.0, 594.0, 1143.0, 2235.0, 4557.0, 9987.0, 25379.0, 76105.0, 303199.0, 449347.0, 114451.0, 35269.0, 13441.0, 5661.0, 2806.0, 1446.0, 784.0, 431.0, 245.0, 162.0, 114.0, 63.0, 48.0, 17.0, 26.0, 11.0, 9.0, 10.0, 5.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.017578125, -1.95068359375, -1.8837890625, -1.81689453125, -1.75, -1.68310546875, -1.6162109375, -1.54931640625, -1.482421875, -1.41552734375, -1.3486328125, -1.28173828125, -1.21484375, -1.14794921875, -1.0810546875, -1.01416015625, -0.947265625, -0.88037109375, -0.8134765625, -0.74658203125, -0.6796875, -0.61279296875, -0.5458984375, -0.47900390625, -0.412109375, -0.34521484375, -0.2783203125, -0.21142578125, -0.14453125, -0.07763671875, -0.0107421875, 0.05615234375, 0.123046875, 0.18994140625, 0.2568359375, 0.32373046875, 0.390625, 0.45751953125, 0.5244140625, 0.59130859375, 0.658203125, 0.72509765625, 0.7919921875, 0.85888671875, 0.92578125, 0.99267578125, 1.0595703125, 1.12646484375, 1.193359375, 1.26025390625, 1.3271484375, 1.39404296875, 1.4609375, 1.52783203125, 1.5947265625, 1.66162109375, 1.728515625, 1.79541015625, 1.8623046875, 1.92919921875, 1.99609375, 2.06298828125, 2.1298828125, 2.19677734375, 2.263671875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 7.0, 1.0, 11.0, 12.0, 19.0, 18.0, 27.0, 34.0, 47.0, 53.0, 62.0, 48.0, 60.0, 62.0, 96.0, 57.0, 72.0, 64.0, 62.0, 40.0, 37.0, 25.0, 22.0, 17.0, 12.0, 12.0, 6.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.794921875, -0.7746047973632812, -0.7542877197265625, -0.7339706420898438, -0.713653564453125, -0.6933364868164062, -0.6730194091796875, -0.6527023315429688, -0.63238525390625, -0.6120681762695312, -0.5917510986328125, -0.5714340209960938, -0.551116943359375, -0.5307998657226562, -0.5104827880859375, -0.49016571044921875, -0.4698486328125, -0.44953155517578125, -0.4292144775390625, -0.40889739990234375, -0.388580322265625, -0.36826324462890625, -0.3479461669921875, -0.32762908935546875, -0.30731201171875, -0.28699493408203125, -0.2666778564453125, -0.24636077880859375, -0.226043701171875, -0.20572662353515625, -0.1854095458984375, -0.16509246826171875, -0.144775390625, -0.12445831298828125, -0.1041412353515625, -0.08382415771484375, -0.063507080078125, -0.04319000244140625, -0.0228729248046875, -0.00255584716796875, 0.01776123046875, 0.03807830810546875, 0.0583953857421875, 0.07871246337890625, 0.099029541015625, 0.11934661865234375, 0.1396636962890625, 0.15998077392578125, 0.1802978515625, 0.20061492919921875, 0.2209320068359375, 0.24124908447265625, 0.261566162109375, 0.28188323974609375, 0.3022003173828125, 0.32251739501953125, 0.34283447265625, 0.36315155029296875, 0.3834686279296875, 0.40378570556640625, 0.424102783203125, 0.44441986083984375, 0.4647369384765625, 0.48505401611328125, 0.50537109375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 6.0, 16.0, 17.0, 27.0, 36.0, 85.0, 98.0, 149.0, 294.0, 523.0, 953.0, 2032.0, 5184.0, 15470.0, 66025.0, 583324.0, 312444.0, 42767.0, 11543.0, 4028.0, 1659.0, 835.0, 409.0, 231.0, 131.0, 73.0, 60.0, 36.0, 36.0, 21.0, 13.0, 7.0, 12.0, 4.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.841796875, -3.72491455078125, -3.6080322265625, -3.49114990234375, -3.374267578125, -3.25738525390625, -3.1405029296875, -3.02362060546875, -2.90673828125, -2.78985595703125, -2.6729736328125, -2.55609130859375, -2.439208984375, -2.32232666015625, -2.2054443359375, -2.08856201171875, -1.9716796875, -1.85479736328125, -1.7379150390625, -1.62103271484375, -1.504150390625, -1.38726806640625, -1.2703857421875, -1.15350341796875, -1.03662109375, -0.91973876953125, -0.8028564453125, -0.68597412109375, -0.569091796875, -0.45220947265625, -0.3353271484375, -0.21844482421875, -0.1015625, 0.01531982421875, 0.1322021484375, 0.24908447265625, 0.365966796875, 0.48284912109375, 0.5997314453125, 0.71661376953125, 0.83349609375, 0.95037841796875, 1.0672607421875, 1.18414306640625, 1.301025390625, 1.41790771484375, 1.5347900390625, 1.65167236328125, 1.7685546875, 1.88543701171875, 2.0023193359375, 2.11920166015625, 2.236083984375, 2.35296630859375, 2.4698486328125, 2.58673095703125, 2.70361328125, 2.82049560546875, 2.9373779296875, 3.05426025390625, 3.171142578125, 3.28802490234375, 3.4049072265625, 3.52178955078125, 3.638671875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 7.0, 4.0, 7.0, 9.0, 5.0, 8.0, 12.0, 19.0, 20.0, 27.0, 29.0, 43.0, 41.0, 65.0, 52.0, 62.0, 74.0, 63.0, 57.0, 65.0, 62.0, 48.0, 48.0, 42.0, 34.0, 21.0, 24.0, 17.0, 10.0, 11.0, 6.0, 5.0, 3.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.412109375, -3.266265869140625, -3.12042236328125, -2.974578857421875, -2.8287353515625, -2.682891845703125, -2.53704833984375, -2.391204833984375, -2.245361328125, -2.099517822265625, -1.95367431640625, -1.807830810546875, -1.6619873046875, -1.516143798828125, -1.37030029296875, -1.224456787109375, -1.07861328125, -0.932769775390625, -0.78692626953125, -0.641082763671875, -0.4952392578125, -0.349395751953125, -0.20355224609375, -0.057708740234375, 0.088134765625, 0.233978271484375, 0.37982177734375, 0.525665283203125, 0.6715087890625, 0.817352294921875, 0.96319580078125, 1.109039306640625, 1.2548828125, 1.400726318359375, 1.54656982421875, 1.692413330078125, 1.8382568359375, 1.984100341796875, 2.12994384765625, 2.275787353515625, 2.421630859375, 2.567474365234375, 2.71331787109375, 2.859161376953125, 3.0050048828125, 3.150848388671875, 3.29669189453125, 3.442535400390625, 3.58837890625, 3.734222412109375, 3.88006591796875, 4.025909423828125, 4.1717529296875, 4.317596435546875, 4.46343994140625, 4.609283447265625, 4.755126953125, 4.900970458984375, 5.04681396484375, 5.192657470703125, 5.3385009765625, 5.484344482421875, 5.63018798828125, 5.776031494140625, 5.921875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 7.0, 8.0, 7.0, 10.0, 24.0, 40.0, 52.0, 72.0, 107.0, 188.0, 290.0, 488.0, 979.0, 2019.0, 5374.0, 21817.0, 297703.0, 675404.0, 32202.0, 6757.0, 2428.0, 1106.0, 587.0, 335.0, 197.0, 139.0, 52.0, 53.0, 31.0, 28.0, 13.0, 11.0, 10.0, 10.0, 6.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.712890625, -2.6397705078125, -2.566650390625, -2.4935302734375, -2.42041015625, -2.3472900390625, -2.274169921875, -2.2010498046875, -2.1279296875, -2.0548095703125, -1.981689453125, -1.9085693359375, -1.83544921875, -1.7623291015625, -1.689208984375, -1.6160888671875, -1.54296875, -1.4698486328125, -1.396728515625, -1.3236083984375, -1.25048828125, -1.1773681640625, -1.104248046875, -1.0311279296875, -0.9580078125, -0.8848876953125, -0.811767578125, -0.7386474609375, -0.66552734375, -0.5924072265625, -0.519287109375, -0.4461669921875, -0.373046875, -0.2999267578125, -0.226806640625, -0.1536865234375, -0.08056640625, -0.0074462890625, 0.065673828125, 0.1387939453125, 0.2119140625, 0.2850341796875, 0.358154296875, 0.4312744140625, 0.50439453125, 0.5775146484375, 0.650634765625, 0.7237548828125, 0.796875, 0.8699951171875, 0.943115234375, 1.0162353515625, 1.08935546875, 1.1624755859375, 1.235595703125, 1.3087158203125, 1.3818359375, 1.4549560546875, 1.528076171875, 1.6011962890625, 1.67431640625, 1.7474365234375, 1.820556640625, 1.8936767578125, 1.966796875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 7.0, 11.0, 15.0, 37.0, 102.0, 219.0, 321.0, 163.0, 64.0, 29.0, 19.0, 9.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00047588348388671875, -0.00046237558126449585, -0.00044886767864227295, -0.00043535977602005005, -0.00042185187339782715, -0.00040834397077560425, -0.00039483606815338135, -0.00038132816553115845, -0.00036782026290893555, -0.00035431236028671265, -0.00034080445766448975, -0.00032729655504226685, -0.00031378865242004395, -0.00030028074979782104, -0.00028677284717559814, -0.00027326494455337524, -0.00025975704193115234, -0.00024624913930892944, -0.00023274123668670654, -0.00021923333406448364, -0.00020572543144226074, -0.00019221752882003784, -0.00017870962619781494, -0.00016520172357559204, -0.00015169382095336914, -0.00013818591833114624, -0.00012467801570892334, -0.00011117011308670044, -9.766221046447754e-05, -8.415430784225464e-05, -7.064640522003174e-05, -5.713850259780884e-05, -4.363059997558594e-05, -3.0122697353363037e-05, -1.6614794731140137e-05, -3.1068921089172363e-06, 1.0401010513305664e-05, 2.3908913135528564e-05, 3.7416815757751465e-05, 5.0924718379974365e-05, 6.443262100219727e-05, 7.794052362442017e-05, 9.144842624664307e-05, 0.00010495632886886597, 0.00011846423149108887, 0.00013197213411331177, 0.00014548003673553467, 0.00015898793935775757, 0.00017249584197998047, 0.00018600374460220337, 0.00019951164722442627, 0.00021301954984664917, 0.00022652745246887207, 0.00024003535509109497, 0.00025354325771331787, 0.00026705116033554077, 0.00028055906295776367, 0.00029406696557998657, 0.00030757486820220947, 0.0003210827708244324, 0.0003345906734466553, 0.0003480985760688782, 0.0003616064786911011, 0.000375114381313324, 0.0003886222839355469]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 1.0, 5.0, 12.0, 8.0, 12.0, 16.0, 29.0, 41.0, 41.0, 86.0, 115.0, 194.0, 315.0, 596.0, 1175.0, 2564.0, 6909.0, 26923.0, 236422.0, 701800.0, 53513.0, 10737.0, 3611.0, 1571.0, 750.0, 430.0, 239.0, 164.0, 89.0, 54.0, 34.0, 28.0, 18.0, 9.0, 8.0, 12.0, 7.0, 2.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3408203125, -1.2932586669921875, -1.245697021484375, -1.1981353759765625, -1.15057373046875, -1.1030120849609375, -1.055450439453125, -1.0078887939453125, -0.9603271484375, -0.9127655029296875, -0.865203857421875, -0.8176422119140625, -0.77008056640625, -0.7225189208984375, -0.674957275390625, -0.6273956298828125, -0.579833984375, -0.5322723388671875, -0.484710693359375, -0.4371490478515625, -0.38958740234375, -0.3420257568359375, -0.294464111328125, -0.2469024658203125, -0.1993408203125, -0.1517791748046875, -0.104217529296875, -0.0566558837890625, -0.00909423828125, 0.0384674072265625, 0.086029052734375, 0.1335906982421875, 0.18115234375, 0.2287139892578125, 0.276275634765625, 0.3238372802734375, 0.37139892578125, 0.4189605712890625, 0.466522216796875, 0.5140838623046875, 0.5616455078125, 0.6092071533203125, 0.656768798828125, 0.7043304443359375, 0.75189208984375, 0.7994537353515625, 0.847015380859375, 0.8945770263671875, 0.942138671875, 0.9897003173828125, 1.037261962890625, 1.0848236083984375, 1.13238525390625, 1.1799468994140625, 1.227508544921875, 1.2750701904296875, 1.3226318359375, 1.3701934814453125, 1.417755126953125, 1.4653167724609375, 1.51287841796875, 1.5604400634765625, 1.608001708984375, 1.6555633544921875, 1.703125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 5.0, 1.0, 2.0, 2.0, 6.0, 5.0, 7.0, 14.0, 13.0, 24.0, 27.0, 38.0, 50.0, 51.0, 103.0, 168.0, 121.0, 98.0, 64.0, 38.0, 35.0, 27.0, 30.0, 19.0, 15.0, 8.0, 9.0, 6.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5205078125, -1.4639129638671875, -1.407318115234375, -1.3507232666015625, -1.29412841796875, -1.2375335693359375, -1.180938720703125, -1.1243438720703125, -1.0677490234375, -1.0111541748046875, -0.954559326171875, -0.8979644775390625, -0.84136962890625, -0.7847747802734375, -0.728179931640625, -0.6715850830078125, -0.614990234375, -0.5583953857421875, -0.501800537109375, -0.4452056884765625, -0.38861083984375, -0.3320159912109375, -0.275421142578125, -0.2188262939453125, -0.1622314453125, -0.1056365966796875, -0.049041748046875, 0.0075531005859375, 0.06414794921875, 0.1207427978515625, 0.177337646484375, 0.2339324951171875, 0.29052734375, 0.3471221923828125, 0.403717041015625, 0.4603118896484375, 0.51690673828125, 0.5735015869140625, 0.630096435546875, 0.6866912841796875, 0.7432861328125, 0.7998809814453125, 0.856475830078125, 0.9130706787109375, 0.96966552734375, 1.0262603759765625, 1.082855224609375, 1.1394500732421875, 1.196044921875, 1.2526397705078125, 1.309234619140625, 1.3658294677734375, 1.42242431640625, 1.4790191650390625, 1.535614013671875, 1.5922088623046875, 1.6488037109375, 1.7053985595703125, 1.761993408203125, 1.8185882568359375, 1.87518310546875, 1.9317779541015625, 1.988372802734375, 2.0449676513671875, 2.1015625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 15.0, 17.0, 23.0, 45.0, 58.0, 103.0, 155.0, 196.0, 137.0, 114.0, 55.0, 26.0, 20.0, 14.0, 9.0, 1.0, 4.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.74540901184082, -29.62629508972168, -28.50718116760254, -27.3880672454834, -26.26895523071289, -25.14984130859375, -24.03072738647461, -22.91161346435547, -21.792499542236328, -20.673385620117188, -19.554271697998047, -18.435157775878906, -17.316043853759766, -16.196929931640625, -15.077817916870117, -13.958703994750977, -12.839590072631836, -11.720476150512695, -10.601362228393555, -9.48224925994873, -8.36313533782959, -7.244021415710449, -6.124907970428467, -5.005794525146484, -3.8866806030273438, -2.7675669193267822, -1.6484532356262207, -0.5293395519256592, 0.5897741317749023, 1.708888053894043, 2.8280014991760254, 3.947114944458008, 5.066226959228516, 6.185340881347656, 7.304454326629639, 8.423567771911621, 9.542681694030762, 10.661795616149902, 11.780908584594727, 12.900022506713867, 14.019136428833008, 15.138250350952148, 16.25736427307129, 17.37647819519043, 18.495590209960938, 19.614704132080078, 20.73381805419922, 21.85293197631836, 22.9720458984375, 24.09115982055664, 25.21027374267578, 26.329387664794922, 27.448501586914062, 28.567615509033203, 29.68672752380371, 30.80584144592285, 31.924955368041992, 33.0440673828125, 34.16318130493164, 35.28229522705078, 36.40140914916992, 37.52052307128906, 38.6396369934082, 39.758750915527344, 40.877864837646484]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 4.0, 3.0, 7.0, 3.0, 10.0, 11.0, 11.0, 15.0, 18.0, 26.0, 26.0, 26.0, 45.0, 58.0, 55.0, 78.0, 62.0, 65.0, 75.0, 58.0, 47.0, 58.0, 34.0, 38.0, 30.0, 29.0, 18.0, 23.0, 12.0, 12.0, 11.0, 7.0, 8.0, 7.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.724720001220703, -28.909807205200195, -28.094894409179688, -27.279979705810547, -26.46506690979004, -25.65015411376953, -24.835241317749023, -24.020328521728516, -23.205413818359375, -22.390501022338867, -21.57558822631836, -20.76067352294922, -19.94576072692871, -19.130847930908203, -18.315935134887695, -17.501022338867188, -16.686107635498047, -15.871194839477539, -15.056281089782715, -14.241368293762207, -13.426454544067383, -12.611541748046875, -11.796628952026367, -10.981715202331543, -10.166803359985352, -9.351890563964844, -8.53697681427002, -7.722064018249512, -6.9071502685546875, -6.09223747253418, -5.277324199676514, -4.462410926818848, -3.6474971771240234, -2.8325839042663574, -2.0176706314086914, -1.2027575969696045, -0.3878443241119385, 0.42706871032714844, 1.2419819831848145, 2.0568952560424805, 2.8718085289001465, 3.6867218017578125, 4.5016350746154785, 5.3165483474731445, 6.131461143493652, 6.946374416351318, 7.761287689208984, 8.576200485229492, 9.391114234924316, 10.206027030944824, 11.020940780639648, 11.835853576660156, 12.65076732635498, 13.465680122375488, 14.280593872070312, 15.09550666809082, 15.910419464111328, 16.725332260131836, 17.540245056152344, 18.355159759521484, 19.170072555541992, 19.9849853515625, 20.799898147583008, 21.614810943603516, 22.429725646972656]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 7.0, 5.0, 8.0, 2.0, 9.0, 9.0, 7.0, 13.0, 17.0, 25.0, 31.0, 23.0, 53.0, 91.0, 122.0, 207.0, 341.0, 598.0, 1179.0, 2676.0, 7419.0, 46596.0, 4108544.0, 17963.0, 4701.0, 1845.0, 849.0, 402.0, 216.0, 129.0, 72.0, 43.0, 25.0, 17.0, 15.0, 7.0, 7.0, 7.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.1796875, -7.96026611328125, -7.7408447265625, -7.52142333984375, -7.302001953125, -7.08258056640625, -6.8631591796875, -6.64373779296875, -6.42431640625, -6.20489501953125, -5.9854736328125, -5.76605224609375, -5.546630859375, -5.32720947265625, -5.1077880859375, -4.88836669921875, -4.6689453125, -4.44952392578125, -4.2301025390625, -4.01068115234375, -3.791259765625, -3.57183837890625, -3.3524169921875, -3.13299560546875, -2.91357421875, -2.69415283203125, -2.4747314453125, -2.25531005859375, -2.035888671875, -1.81646728515625, -1.5970458984375, -1.37762451171875, -1.158203125, -0.93878173828125, -0.7193603515625, -0.49993896484375, -0.280517578125, -0.06109619140625, 0.1583251953125, 0.37774658203125, 0.59716796875, 0.81658935546875, 1.0360107421875, 1.25543212890625, 1.474853515625, 1.69427490234375, 1.9136962890625, 2.13311767578125, 2.3525390625, 2.57196044921875, 2.7913818359375, 3.01080322265625, 3.230224609375, 3.44964599609375, 3.6690673828125, 3.88848876953125, 4.10791015625, 4.32733154296875, 4.5467529296875, 4.76617431640625, 4.985595703125, 5.20501708984375, 5.4244384765625, 5.64385986328125, 5.86328125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 6.0, 2.0, 3.0, 6.0, 12.0, 12.0, 17.0, 25.0, 38.0, 50.0, 64.0, 93.0, 110.0, 107.0, 96.0, 90.0, 90.0, 62.0, 39.0, 19.0, 18.0, 13.0, 8.0, 6.0, 2.0, 7.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3818359375, -1.34271240234375, -1.3035888671875, -1.26446533203125, -1.225341796875, -1.18621826171875, -1.1470947265625, -1.10797119140625, -1.06884765625, -1.02972412109375, -0.9906005859375, -0.95147705078125, -0.912353515625, -0.87322998046875, -0.8341064453125, -0.79498291015625, -0.755859375, -0.71673583984375, -0.6776123046875, -0.63848876953125, -0.599365234375, -0.56024169921875, -0.5211181640625, -0.48199462890625, -0.44287109375, -0.40374755859375, -0.3646240234375, -0.32550048828125, -0.286376953125, -0.24725341796875, -0.2081298828125, -0.16900634765625, -0.1298828125, -0.09075927734375, -0.0516357421875, -0.01251220703125, 0.026611328125, 0.06573486328125, 0.1048583984375, 0.14398193359375, 0.18310546875, 0.22222900390625, 0.2613525390625, 0.30047607421875, 0.339599609375, 0.37872314453125, 0.4178466796875, 0.45697021484375, 0.49609375, 0.53521728515625, 0.5743408203125, 0.61346435546875, 0.652587890625, 0.69171142578125, 0.7308349609375, 0.76995849609375, 0.80908203125, 0.84820556640625, 0.8873291015625, 0.92645263671875, 0.965576171875, 1.00469970703125, 1.0438232421875, 1.08294677734375, 1.1220703125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 7.0, 12.0, 13.0, 18.0, 17.0, 26.0, 39.0, 52.0, 74.0, 100.0, 113.0, 146.0, 216.0, 296.0, 432.0, 540.0, 820.0, 1245.0, 1816.0, 3049.0, 5212.0, 10296.0, 25688.0, 854346.0, 3239453.0, 25768.0, 10387.0, 5231.0, 3016.0, 1764.0, 1183.0, 795.0, 558.0, 386.0, 303.0, 184.0, 182.0, 131.0, 89.0, 69.0, 57.0, 39.0, 36.0, 21.0, 17.0, 14.0, 11.0, 10.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-5.9375, -5.76287841796875, -5.5882568359375, -5.41363525390625, -5.239013671875, -5.06439208984375, -4.8897705078125, -4.71514892578125, -4.54052734375, -4.36590576171875, -4.1912841796875, -4.01666259765625, -3.842041015625, -3.66741943359375, -3.4927978515625, -3.31817626953125, -3.1435546875, -2.96893310546875, -2.7943115234375, -2.61968994140625, -2.445068359375, -2.27044677734375, -2.0958251953125, -1.92120361328125, -1.74658203125, -1.57196044921875, -1.3973388671875, -1.22271728515625, -1.048095703125, -0.87347412109375, -0.6988525390625, -0.52423095703125, -0.349609375, -0.17498779296875, -0.0003662109375, 0.17425537109375, 0.348876953125, 0.52349853515625, 0.6981201171875, 0.87274169921875, 1.04736328125, 1.22198486328125, 1.3966064453125, 1.57122802734375, 1.745849609375, 1.92047119140625, 2.0950927734375, 2.26971435546875, 2.4443359375, 2.61895751953125, 2.7935791015625, 2.96820068359375, 3.142822265625, 3.31744384765625, 3.4920654296875, 3.66668701171875, 3.84130859375, 4.01593017578125, 4.1905517578125, 4.36517333984375, 4.539794921875, 4.71441650390625, 4.8890380859375, 5.06365966796875, 5.23828125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 9.0, 10.0, 12.0, 12.0, 23.0, 71.0, 3711.0, 94.0, 40.0, 28.0, 15.0, 7.0, 11.0, 4.0, 4.0, 1.0, 2.0, 5.0, 1.0, 0.0, 0.0, 5.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.203125, -2.137420654296875, -2.07171630859375, -2.006011962890625, -1.9403076171875, -1.874603271484375, -1.80889892578125, -1.743194580078125, -1.677490234375, -1.611785888671875, -1.54608154296875, -1.480377197265625, -1.4146728515625, -1.348968505859375, -1.28326416015625, -1.217559814453125, -1.15185546875, -1.086151123046875, -1.02044677734375, -0.954742431640625, -0.8890380859375, -0.823333740234375, -0.75762939453125, -0.691925048828125, -0.626220703125, -0.560516357421875, -0.49481201171875, -0.429107666015625, -0.3634033203125, -0.297698974609375, -0.23199462890625, -0.166290283203125, -0.1005859375, -0.034881591796875, 0.03082275390625, 0.096527099609375, 0.1622314453125, 0.227935791015625, 0.29364013671875, 0.359344482421875, 0.425048828125, 0.490753173828125, 0.55645751953125, 0.622161865234375, 0.6878662109375, 0.753570556640625, 0.81927490234375, 0.884979248046875, 0.95068359375, 1.016387939453125, 1.08209228515625, 1.147796630859375, 1.2135009765625, 1.279205322265625, 1.34490966796875, 1.410614013671875, 1.476318359375, 1.542022705078125, 1.60772705078125, 1.673431396484375, 1.7391357421875, 1.804840087890625, 1.87054443359375, 1.936248779296875, 2.001953125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 6.0, 10.0, 22.0, 18.0, 26.0, 36.0, 78.0, 91.0, 144.0, 144.0, 99.0, 105.0, 63.0, 47.0, 28.0, 23.0, 11.0, 17.0, 11.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.044249534606934, -7.791569709777832, -7.538889408111572, -7.286209583282471, -7.033529281616211, -6.780849456787109, -6.528169631958008, -6.275489807128906, -6.0228095054626465, -5.770129680633545, -5.517449378967285, -5.264769554138184, -5.012089729309082, -4.759409427642822, -4.506729602813721, -4.254049301147461, -4.001369476318359, -3.7486894130706787, -3.496009349822998, -3.2433295249938965, -2.990649461746216, -2.737969398498535, -2.4852895736694336, -2.232609510421753, -1.9799294471740723, -1.7272493839263916, -1.4745694398880005, -1.2218894958496094, -0.9692094326019287, -0.716529369354248, -0.46384942531585693, -0.21116948127746582, 0.04150962829589844, 0.2941896319389343, 0.5468696355819702, 0.7995496392250061, 1.052229642868042, 1.3049097061157227, 1.5575896501541138, 1.8102695941925049, 2.0629496574401855, 2.315629720687866, 2.568309783935547, 2.8209896087646484, 3.073669672012329, 3.3263497352600098, 3.5790295600891113, 3.831709623336792, 4.084389686584473, 4.337069511413574, 4.589749813079834, 4.8424296379089355, 5.095109939575195, 5.347789764404297, 5.600469589233398, 5.8531494140625, 6.10582971572876, 6.358509540557861, 6.611189842224121, 6.863869667053223, 7.116549491882324, 7.369229793548584, 7.6219096183776855, 7.874589920043945, 8.127269744873047]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 1.0, 3.0, 5.0, 6.0, 14.0, 8.0, 23.0, 16.0, 16.0, 16.0, 20.0, 14.0, 22.0, 25.0, 29.0, 32.0, 29.0, 33.0, 38.0, 49.0, 38.0, 43.0, 45.0, 39.0, 44.0, 43.0, 35.0, 38.0, 32.0, 35.0, 29.0, 26.0, 23.0, 25.0, 18.0, 12.0, 9.0, 12.0, 8.0, 11.0, 7.0, 5.0, 7.0, 6.0, 5.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.204047203063965, -5.041396141052246, -4.878745079040527, -4.716094017028809, -4.55344295501709, -4.390791893005371, -4.228140830993652, -4.065489768981934, -3.9028384685516357, -3.740187406539917, -3.5775363445281982, -3.4148852825164795, -3.2522339820861816, -3.089582920074463, -2.926931858062744, -2.7642807960510254, -2.6016297340393066, -2.438978672027588, -2.276327610015869, -2.1136765480041504, -1.951025366783142, -1.7883743047714233, -1.625723123550415, -1.4630720615386963, -1.3004209995269775, -1.1377699375152588, -0.9751188158988953, -0.8124676942825317, -0.649816632270813, -0.48716557025909424, -0.3245144486427307, -0.1618633270263672, 0.0007877349853515625, 0.1634388267993927, 0.32608991861343384, 0.488741010427475, 0.6513921022415161, 0.8140431642532349, 0.9766942858695984, 1.139345407485962, 1.3019964694976807, 1.4646475315093994, 1.6272985935211182, 1.7899497747421265, 1.9526008367538452, 2.1152520179748535, 2.2779030799865723, 2.440554141998291, 2.6032052040100098, 2.7658562660217285, 2.9285073280334473, 3.091158390045166, 3.2538094520568848, 3.4164605140686035, 3.5791118144989014, 3.74176287651062, 3.904413938522339, 4.067065238952637, 4.2297163009643555, 4.392367362976074, 4.555018424987793, 4.717669486999512, 4.8803205490112305, 5.042971611022949, 5.205622673034668]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 4.0, 8.0, 10.0, 12.0, 10.0, 14.0, 25.0, 27.0, 40.0, 69.0, 76.0, 145.0, 188.0, 321.0, 508.0, 747.0, 1360.0, 2433.0, 4817.0, 10013.0, 23870.0, 68408.0, 266204.0, 474316.0, 126769.0, 38578.0, 14852.0, 6771.0, 3392.0, 1807.0, 1003.0, 616.0, 368.0, 259.0, 150.0, 94.0, 70.0, 69.0, 40.0, 27.0, 16.0, 19.0, 9.0, 12.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-3.166015625, -3.070770263671875, -2.97552490234375, -2.880279541015625, -2.7850341796875, -2.689788818359375, -2.59454345703125, -2.499298095703125, -2.404052734375, -2.308807373046875, -2.21356201171875, -2.118316650390625, -2.0230712890625, -1.927825927734375, -1.83258056640625, -1.737335205078125, -1.64208984375, -1.546844482421875, -1.45159912109375, -1.356353759765625, -1.2611083984375, -1.165863037109375, -1.07061767578125, -0.975372314453125, -0.880126953125, -0.784881591796875, -0.68963623046875, -0.594390869140625, -0.4991455078125, -0.403900146484375, -0.30865478515625, -0.213409423828125, -0.1181640625, -0.022918701171875, 0.07232666015625, 0.167572021484375, 0.2628173828125, 0.358062744140625, 0.45330810546875, 0.548553466796875, 0.643798828125, 0.739044189453125, 0.83428955078125, 0.929534912109375, 1.0247802734375, 1.120025634765625, 1.21527099609375, 1.310516357421875, 1.40576171875, 1.501007080078125, 1.59625244140625, 1.691497802734375, 1.7867431640625, 1.881988525390625, 1.97723388671875, 2.072479248046875, 2.167724609375, 2.262969970703125, 2.35821533203125, 2.453460693359375, 2.5487060546875, 2.643951416015625, 2.73919677734375, 2.834442138671875, 2.9296875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 7.0, 2.0, 4.0, 7.0, 16.0, 12.0, 17.0, 22.0, 35.0, 35.0, 47.0, 40.0, 69.0, 72.0, 99.0, 85.0, 87.0, 72.0, 50.0, 40.0, 49.0, 39.0, 33.0, 17.0, 14.0, 9.0, 9.0, 4.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.5146484375, -1.4702911376953125, -1.425933837890625, -1.3815765380859375, -1.33721923828125, -1.2928619384765625, -1.248504638671875, -1.2041473388671875, -1.1597900390625, -1.1154327392578125, -1.071075439453125, -1.0267181396484375, -0.98236083984375, -0.9380035400390625, -0.893646240234375, -0.8492889404296875, -0.804931640625, -0.7605743408203125, -0.716217041015625, -0.6718597412109375, -0.62750244140625, -0.5831451416015625, -0.538787841796875, -0.4944305419921875, -0.4500732421875, -0.4057159423828125, -0.361358642578125, -0.3170013427734375, -0.27264404296875, -0.2282867431640625, -0.183929443359375, -0.1395721435546875, -0.09521484375, -0.0508575439453125, -0.006500244140625, 0.0378570556640625, 0.08221435546875, 0.1265716552734375, 0.170928955078125, 0.2152862548828125, 0.2596435546875, 0.3040008544921875, 0.348358154296875, 0.3927154541015625, 0.43707275390625, 0.4814300537109375, 0.525787353515625, 0.5701446533203125, 0.614501953125, 0.6588592529296875, 0.703216552734375, 0.7475738525390625, 0.79193115234375, 0.8362884521484375, 0.880645751953125, 0.9250030517578125, 0.9693603515625, 1.0137176513671875, 1.058074951171875, 1.1024322509765625, 1.14678955078125, 1.1911468505859375, 1.235504150390625, 1.2798614501953125, 1.32421875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 12.0, 8.0, 5.0, 26.0, 49.0, 54.0, 106.0, 196.0, 355.0, 742.0, 1703.0, 4871.0, 19662.0, 164109.0, 769441.0, 69662.0, 11596.0, 3437.0, 1235.0, 570.0, 297.0, 159.0, 100.0, 51.0, 40.0, 28.0, 11.0, 8.0, 5.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0703125, -7.795166015625, -7.52001953125, -7.244873046875, -6.9697265625, -6.694580078125, -6.41943359375, -6.144287109375, -5.869140625, -5.593994140625, -5.31884765625, -5.043701171875, -4.7685546875, -4.493408203125, -4.21826171875, -3.943115234375, -3.66796875, -3.392822265625, -3.11767578125, -2.842529296875, -2.5673828125, -2.292236328125, -2.01708984375, -1.741943359375, -1.466796875, -1.191650390625, -0.91650390625, -0.641357421875, -0.3662109375, -0.091064453125, 0.18408203125, 0.459228515625, 0.734375, 1.009521484375, 1.28466796875, 1.559814453125, 1.8349609375, 2.110107421875, 2.38525390625, 2.660400390625, 2.935546875, 3.210693359375, 3.48583984375, 3.760986328125, 4.0361328125, 4.311279296875, 4.58642578125, 4.861572265625, 5.13671875, 5.411865234375, 5.68701171875, 5.962158203125, 6.2373046875, 6.512451171875, 6.78759765625, 7.062744140625, 7.337890625, 7.613037109375, 7.88818359375, 8.163330078125, 8.4384765625, 8.713623046875, 8.98876953125, 9.263916015625, 9.5390625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 6.0, 0.0, 2.0, 6.0, 5.0, 5.0, 6.0, 2.0, 8.0, 19.0, 12.0, 16.0, 23.0, 41.0, 47.0, 58.0, 47.0, 71.0, 84.0, 96.0, 75.0, 71.0, 49.0, 50.0, 43.0, 33.0, 37.0, 18.0, 22.0, 9.0, 13.0, 10.0, 10.0, 7.0, 2.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.6796875, -9.35302734375, -9.0263671875, -8.69970703125, -8.373046875, -8.04638671875, -7.7197265625, -7.39306640625, -7.06640625, -6.73974609375, -6.4130859375, -6.08642578125, -5.759765625, -5.43310546875, -5.1064453125, -4.77978515625, -4.453125, -4.12646484375, -3.7998046875, -3.47314453125, -3.146484375, -2.81982421875, -2.4931640625, -2.16650390625, -1.83984375, -1.51318359375, -1.1865234375, -0.85986328125, -0.533203125, -0.20654296875, 0.1201171875, 0.44677734375, 0.7734375, 1.10009765625, 1.4267578125, 1.75341796875, 2.080078125, 2.40673828125, 2.7333984375, 3.06005859375, 3.38671875, 3.71337890625, 4.0400390625, 4.36669921875, 4.693359375, 5.02001953125, 5.3466796875, 5.67333984375, 6.0, 6.32666015625, 6.6533203125, 6.97998046875, 7.306640625, 7.63330078125, 7.9599609375, 8.28662109375, 8.61328125, 8.93994140625, 9.2666015625, 9.59326171875, 9.919921875, 10.24658203125, 10.5732421875, 10.89990234375, 11.2265625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 11.0, 4.0, 15.0, 14.0, 32.0, 59.0, 75.0, 141.0, 285.0, 751.0, 3179.0, 137673.0, 898530.0, 5919.0, 1046.0, 382.0, 163.0, 104.0, 58.0, 38.0, 30.0, 12.0, 14.0, 4.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.46875, -10.162109375, -9.85546875, -9.548828125, -9.2421875, -8.935546875, -8.62890625, -8.322265625, -8.015625, -7.708984375, -7.40234375, -7.095703125, -6.7890625, -6.482421875, -6.17578125, -5.869140625, -5.5625, -5.255859375, -4.94921875, -4.642578125, -4.3359375, -4.029296875, -3.72265625, -3.416015625, -3.109375, -2.802734375, -2.49609375, -2.189453125, -1.8828125, -1.576171875, -1.26953125, -0.962890625, -0.65625, -0.349609375, -0.04296875, 0.263671875, 0.5703125, 0.876953125, 1.18359375, 1.490234375, 1.796875, 2.103515625, 2.41015625, 2.716796875, 3.0234375, 3.330078125, 3.63671875, 3.943359375, 4.25, 4.556640625, 4.86328125, 5.169921875, 5.4765625, 5.783203125, 6.08984375, 6.396484375, 6.703125, 7.009765625, 7.31640625, 7.623046875, 7.9296875, 8.236328125, 8.54296875, 8.849609375, 9.15625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 10.0, 14.0, 38.0, 65.0, 153.0, 278.0, 221.0, 126.0, 49.0, 25.0, 14.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006799697875976562, -0.0006571859121322632, -0.0006344020366668701, -0.000611618161201477, -0.000588834285736084, -0.0005660504102706909, -0.0005432665348052979, -0.0005204826593399048, -0.0004976987838745117, -0.00047491490840911865, -0.0004521310329437256, -0.0004293471574783325, -0.00040656328201293945, -0.0003837794065475464, -0.0003609955310821533, -0.00033821165561676025, -0.0003154277801513672, -0.0002926439046859741, -0.00026986002922058105, -0.000247076153755188, -0.00022429227828979492, -0.00020150840282440186, -0.0001787245273590088, -0.00015594065189361572, -0.00013315677642822266, -0.00011037290096282959, -8.758902549743652e-05, -6.480515003204346e-05, -4.202127456665039e-05, -1.9237399101257324e-05, 3.546476364135742e-06, 2.633035182952881e-05, 4.9114227294921875e-05, 7.189810276031494e-05, 9.468197822570801e-05, 0.00011746585369110107, 0.00014024972915649414, 0.0001630336046218872, 0.00018581748008728027, 0.00020860135555267334, 0.0002313852310180664, 0.00025416910648345947, 0.00027695298194885254, 0.0002997368574142456, 0.00032252073287963867, 0.00034530460834503174, 0.0003680884838104248, 0.00039087235927581787, 0.00041365623474121094, 0.000436440110206604, 0.00045922398567199707, 0.00048200786113739014, 0.0005047917366027832, 0.0005275756120681763, 0.0005503594875335693, 0.0005731433629989624, 0.0005959272384643555, 0.0006187111139297485, 0.0006414949893951416, 0.0006642788648605347, 0.0006870627403259277, 0.0007098466157913208, 0.0007326304912567139, 0.0007554143667221069, 0.0007781982421875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 3.0, 6.0, 6.0, 15.0, 19.0, 22.0, 47.0, 107.0, 168.0, 350.0, 827.0, 2188.0, 8513.0, 81563.0, 896578.0, 48473.0, 6427.0, 1879.0, 693.0, 303.0, 158.0, 81.0, 47.0, 30.0, 11.0, 9.0, 5.0, 5.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.89453125, -4.7523193359375, -4.610107421875, -4.4678955078125, -4.32568359375, -4.1834716796875, -4.041259765625, -3.8990478515625, -3.7568359375, -3.6146240234375, -3.472412109375, -3.3302001953125, -3.18798828125, -3.0457763671875, -2.903564453125, -2.7613525390625, -2.619140625, -2.4769287109375, -2.334716796875, -2.1925048828125, -2.05029296875, -1.9080810546875, -1.765869140625, -1.6236572265625, -1.4814453125, -1.3392333984375, -1.197021484375, -1.0548095703125, -0.91259765625, -0.7703857421875, -0.628173828125, -0.4859619140625, -0.34375, -0.2015380859375, -0.059326171875, 0.0828857421875, 0.22509765625, 0.3673095703125, 0.509521484375, 0.6517333984375, 0.7939453125, 0.9361572265625, 1.078369140625, 1.2205810546875, 1.36279296875, 1.5050048828125, 1.647216796875, 1.7894287109375, 1.931640625, 2.0738525390625, 2.216064453125, 2.3582763671875, 2.50048828125, 2.6427001953125, 2.784912109375, 2.9271240234375, 3.0693359375, 3.2115478515625, 3.353759765625, 3.4959716796875, 3.63818359375, 3.7803955078125, 3.922607421875, 4.0648193359375, 4.20703125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 7.0, 21.0, 23.0, 56.0, 144.0, 245.0, 243.0, 141.0, 61.0, 27.0, 10.0, 4.0, 8.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.703125, -5.4990234375, -5.294921875, -5.0908203125, -4.88671875, -4.6826171875, -4.478515625, -4.2744140625, -4.0703125, -3.8662109375, -3.662109375, -3.4580078125, -3.25390625, -3.0498046875, -2.845703125, -2.6416015625, -2.4375, -2.2333984375, -2.029296875, -1.8251953125, -1.62109375, -1.4169921875, -1.212890625, -1.0087890625, -0.8046875, -0.6005859375, -0.396484375, -0.1923828125, 0.01171875, 0.2158203125, 0.419921875, 0.6240234375, 0.828125, 1.0322265625, 1.236328125, 1.4404296875, 1.64453125, 1.8486328125, 2.052734375, 2.2568359375, 2.4609375, 2.6650390625, 2.869140625, 3.0732421875, 3.27734375, 3.4814453125, 3.685546875, 3.8896484375, 4.09375, 4.2978515625, 4.501953125, 4.7060546875, 4.91015625, 5.1142578125, 5.318359375, 5.5224609375, 5.7265625, 5.9306640625, 6.134765625, 6.3388671875, 6.54296875, 6.7470703125, 6.951171875, 7.1552734375, 7.359375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 9.0, 10.0, 5.0, 9.0, 22.0, 24.0, 32.0, 59.0, 65.0, 110.0, 118.0, 132.0, 112.0, 94.0, 72.0, 37.0, 32.0, 17.0, 16.0, 11.0, 10.0, 3.0, 4.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-58.40155029296875, -56.9228630065918, -55.44417953491211, -53.965492248535156, -52.48680877685547, -51.008121490478516, -49.52943420410156, -48.050750732421875, -46.57206344604492, -45.09337615966797, -43.61469268798828, -42.13600540161133, -40.657318115234375, -39.17863464355469, -37.699947357177734, -36.22126007080078, -34.742576599121094, -33.26388931274414, -31.785205841064453, -30.3065185546875, -28.82783317565918, -27.34914779663086, -25.870460510253906, -24.391775131225586, -22.913089752197266, -21.434404373168945, -19.955718994140625, -18.477031707763672, -16.99834632873535, -15.519660949707031, -14.040974617004395, -12.562288284301758, -11.083602905273438, -9.604917526245117, -8.12623119354248, -6.647545337677002, -5.168859481811523, -3.690173625946045, -2.2114877700805664, -0.7328014373779297, 0.7458839416503906, 2.224569797515869, 3.7032556533813477, 5.181941509246826, 6.660627365112305, 8.139312744140625, 9.617999076843262, 11.096685409545898, 12.575370788574219, 14.054056167602539, 15.532742500305176, 17.011428833007812, 18.490114212036133, 19.968799591064453, 21.447486877441406, 22.926172256469727, 24.404857635498047, 25.883543014526367, 27.362228393554688, 28.84091567993164, 30.31960105895996, 31.79828643798828, 33.276973724365234, 34.75566101074219, 36.234344482421875]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 2.0, 4.0, 10.0, 6.0, 10.0, 6.0, 11.0, 17.0, 15.0, 23.0, 23.0, 22.0, 36.0, 40.0, 44.0, 49.0, 59.0, 57.0, 71.0, 65.0, 58.0, 56.0, 47.0, 53.0, 55.0, 34.0, 22.0, 25.0, 13.0, 15.0, 14.0, 8.0, 7.0, 7.0, 5.0, 5.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-52.012306213378906, -50.55244827270508, -49.09259033203125, -47.63273239135742, -46.172874450683594, -44.713016510009766, -43.25315856933594, -41.79330062866211, -40.33344268798828, -38.87358474731445, -37.413726806640625, -35.9538688659668, -34.49401092529297, -33.03415298461914, -31.574295043945312, -30.114437103271484, -28.654577255249023, -27.194719314575195, -25.734861373901367, -24.27500343322754, -22.81514549255371, -21.355287551879883, -19.895427703857422, -18.435569763183594, -16.975711822509766, -15.515853881835938, -14.05599594116211, -12.596138000488281, -11.136280059814453, -9.676422119140625, -8.21656322479248, -6.756705284118652, -5.296848297119141, -3.8369903564453125, -2.3771321773529053, -0.917273998260498, 0.5425839424133301, 2.002441883087158, 3.4623003005981445, 4.922158241271973, 6.382016181945801, 7.841874122619629, 9.301732063293457, 10.761590957641602, 12.22144889831543, 13.681306838989258, 15.141164779663086, 16.601022720336914, 18.060880661010742, 19.52073860168457, 20.9805965423584, 22.440454483032227, 23.900312423706055, 25.360170364379883, 26.820030212402344, 28.279888153076172, 29.73974609375, 31.199604034423828, 32.659461975097656, 34.119319915771484, 35.57917785644531, 37.03903579711914, 38.49889373779297, 39.9587516784668, 41.418609619140625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 4.0, 9.0, 11.0, 8.0, 10.0, 17.0, 23.0, 45.0, 69.0, 106.0, 212.0, 399.0, 1073.0, 4646.0, 4179404.0, 6065.0, 1262.0, 440.0, 211.0, 103.0, 63.0, 35.0, 27.0, 10.0, 10.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.890625, -28.177978515625, -27.46533203125, -26.752685546875, -26.0400390625, -25.327392578125, -24.61474609375, -23.902099609375, -23.189453125, -22.476806640625, -21.76416015625, -21.051513671875, -20.3388671875, -19.626220703125, -18.91357421875, -18.200927734375, -17.48828125, -16.775634765625, -16.06298828125, -15.350341796875, -14.6376953125, -13.925048828125, -13.21240234375, -12.499755859375, -11.787109375, -11.074462890625, -10.36181640625, -9.649169921875, -8.9365234375, -8.223876953125, -7.51123046875, -6.798583984375, -6.0859375, -5.373291015625, -4.66064453125, -3.947998046875, -3.2353515625, -2.522705078125, -1.81005859375, -1.097412109375, -0.384765625, 0.327880859375, 1.04052734375, 1.753173828125, 2.4658203125, 3.178466796875, 3.89111328125, 4.603759765625, 5.31640625, 6.029052734375, 6.74169921875, 7.454345703125, 8.1669921875, 8.879638671875, 9.59228515625, 10.304931640625, 11.017578125, 11.730224609375, 12.44287109375, 13.155517578125, 13.8681640625, 14.580810546875, 15.29345703125, 16.006103515625, 16.71875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 6.0, 3.0, 5.0, 6.0, 13.0, 15.0, 20.0, 38.0, 49.0, 81.0, 111.0, 152.0, 151.0, 128.0, 73.0, 45.0, 41.0, 21.0, 14.0, 5.0, 15.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.328125, -3.23248291015625, -3.1368408203125, -3.04119873046875, -2.945556640625, -2.84991455078125, -2.7542724609375, -2.65863037109375, -2.56298828125, -2.46734619140625, -2.3717041015625, -2.27606201171875, -2.180419921875, -2.08477783203125, -1.9891357421875, -1.89349365234375, -1.7978515625, -1.70220947265625, -1.6065673828125, -1.51092529296875, -1.415283203125, -1.31964111328125, -1.2239990234375, -1.12835693359375, -1.03271484375, -0.93707275390625, -0.8414306640625, -0.74578857421875, -0.650146484375, -0.55450439453125, -0.4588623046875, -0.36322021484375, -0.267578125, -0.17193603515625, -0.0762939453125, 0.01934814453125, 0.114990234375, 0.21063232421875, 0.3062744140625, 0.40191650390625, 0.49755859375, 0.59320068359375, 0.6888427734375, 0.78448486328125, 0.880126953125, 0.97576904296875, 1.0714111328125, 1.16705322265625, 1.2626953125, 1.35833740234375, 1.4539794921875, 1.54962158203125, 1.645263671875, 1.74090576171875, 1.8365478515625, 1.93218994140625, 2.02783203125, 2.12347412109375, 2.2191162109375, 2.31475830078125, 2.410400390625, 2.50604248046875, 2.6016845703125, 2.69732666015625, 2.79296875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 8.0, 5.0, 9.0, 12.0, 23.0, 33.0, 39.0, 37.0, 49.0, 83.0, 106.0, 149.0, 167.0, 237.0, 323.0, 462.0, 685.0, 1075.0, 2079.0, 7041.0, 4152728.0, 21295.0, 3340.0, 1452.0, 855.0, 560.0, 400.0, 295.0, 200.0, 137.0, 101.0, 73.0, 63.0, 44.0, 18.0, 24.0, 18.0, 18.0, 9.0, 10.0, 7.0, 4.0, 6.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-19.375, -18.817138671875, -18.25927734375, -17.701416015625, -17.1435546875, -16.585693359375, -16.02783203125, -15.469970703125, -14.912109375, -14.354248046875, -13.79638671875, -13.238525390625, -12.6806640625, -12.122802734375, -11.56494140625, -11.007080078125, -10.44921875, -9.891357421875, -9.33349609375, -8.775634765625, -8.2177734375, -7.659912109375, -7.10205078125, -6.544189453125, -5.986328125, -5.428466796875, -4.87060546875, -4.312744140625, -3.7548828125, -3.197021484375, -2.63916015625, -2.081298828125, -1.5234375, -0.965576171875, -0.40771484375, 0.150146484375, 0.7080078125, 1.265869140625, 1.82373046875, 2.381591796875, 2.939453125, 3.497314453125, 4.05517578125, 4.613037109375, 5.1708984375, 5.728759765625, 6.28662109375, 6.844482421875, 7.40234375, 7.960205078125, 8.51806640625, 9.075927734375, 9.6337890625, 10.191650390625, 10.74951171875, 11.307373046875, 11.865234375, 12.423095703125, 12.98095703125, 13.538818359375, 14.0966796875, 14.654541015625, 15.21240234375, 15.770263671875, 16.328125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 10.0, 10.0, 104.0, 3906.0, 30.0, 3.0, 3.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.78515625, -4.652984619140625, -4.52081298828125, -4.388641357421875, -4.2564697265625, -4.124298095703125, -3.99212646484375, -3.859954833984375, -3.727783203125, -3.595611572265625, -3.46343994140625, -3.331268310546875, -3.1990966796875, -3.066925048828125, -2.93475341796875, -2.802581787109375, -2.67041015625, -2.538238525390625, -2.40606689453125, -2.273895263671875, -2.1417236328125, -2.009552001953125, -1.87738037109375, -1.745208740234375, -1.613037109375, -1.480865478515625, -1.34869384765625, -1.216522216796875, -1.0843505859375, -0.952178955078125, -0.82000732421875, -0.687835693359375, -0.5556640625, -0.423492431640625, -0.29132080078125, -0.159149169921875, -0.0269775390625, 0.105194091796875, 0.23736572265625, 0.369537353515625, 0.501708984375, 0.633880615234375, 0.76605224609375, 0.898223876953125, 1.0303955078125, 1.162567138671875, 1.29473876953125, 1.426910400390625, 1.55908203125, 1.691253662109375, 1.82342529296875, 1.955596923828125, 2.0877685546875, 2.219940185546875, 2.35211181640625, 2.484283447265625, 2.616455078125, 2.748626708984375, 2.88079833984375, 3.012969970703125, 3.1451416015625, 3.277313232421875, 3.40948486328125, 3.541656494140625, 3.673828125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 8.0, 5.0, 4.0, 3.0, 9.0, 15.0, 19.0, 27.0, 29.0, 33.0, 49.0, 62.0, 88.0, 123.0, 122.0, 121.0, 87.0, 56.0, 37.0, 31.0, 18.0, 19.0, 14.0, 9.0, 7.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.563186645507812, -8.302862167358398, -8.042536735534668, -7.782212257385254, -7.521887302398682, -7.261562347412109, -7.001237869262695, -6.740912914276123, -6.480587959289551, -6.2202630043029785, -5.9599385261535645, -5.699613571166992, -5.43928861618042, -5.178963661193848, -4.918639183044434, -4.658314228057861, -4.397989749908447, -4.137664794921875, -3.877340078353882, -3.6170153617858887, -3.3566904067993164, -3.0963656902313232, -2.83604097366333, -2.575716018676758, -2.3153913021087646, -2.0550665855407715, -1.7947416305541992, -1.534416913986206, -1.2740920782089233, -1.0137672424316406, -0.7534425258636475, -0.49311769008636475, -0.23279285430908203, 0.027531951665878296, 0.2878567576408386, 0.5481815338134766, 0.8085063695907593, 1.068831205368042, 1.3291559219360352, 1.5894807577133179, 1.8498055934906006, 2.1101303100585938, 2.370455265045166, 2.630779981613159, 2.8911046981811523, 3.1514296531677246, 3.4117543697357178, 3.672079086303711, 3.932404041290283, 4.1927289962768555, 4.4530534744262695, 4.713378429412842, 4.973703384399414, 5.234027862548828, 5.4943528175354, 5.754677772521973, 6.015002250671387, 6.275327205657959, 6.535651683807373, 6.795976638793945, 7.056301593780518, 7.31662654876709, 7.576951026916504, 7.837275981903076, 8.097600936889648]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 6.0, 3.0, 4.0, 7.0, 13.0, 4.0, 11.0, 15.0, 12.0, 17.0, 21.0, 19.0, 33.0, 28.0, 33.0, 42.0, 42.0, 42.0, 36.0, 47.0, 32.0, 39.0, 44.0, 43.0, 29.0, 48.0, 44.0, 29.0, 29.0, 35.0, 26.0, 27.0, 20.0, 30.0, 12.0, 19.0, 12.0, 12.0, 10.0, 7.0, 6.0, 7.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.181884288787842, -5.013457775115967, -4.84503173828125, -4.676605224609375, -4.5081787109375, -4.339752197265625, -4.17132568359375, -4.002899646759033, -3.834473133087158, -3.666046619415283, -3.4976203441619873, -3.3291940689086914, -3.1607675552368164, -2.9923410415649414, -2.8239147663116455, -2.6554884910583496, -2.4870619773864746, -2.3186354637145996, -2.1502091884613037, -1.9817827939987183, -1.8133563995361328, -1.6449300050735474, -1.476503610610962, -1.3080772161483765, -1.139650821685791, -0.9712244272232056, -0.8027980327606201, -0.6343716382980347, -0.4659452438354492, -0.29751884937286377, -0.12909245491027832, 0.03933393955230713, 0.20776081085205078, 0.37618720531463623, 0.5446135997772217, 0.7130399942398071, 0.8814663887023926, 1.049892783164978, 1.2183191776275635, 1.386745572090149, 1.5551719665527344, 1.7235983610153198, 1.8920247554779053, 2.060451030731201, 2.228877544403076, 2.397304058074951, 2.565730333328247, 2.734156608581543, 2.902583122253418, 3.071009635925293, 3.239435911178589, 3.4078621864318848, 3.5762887001037598, 3.7447152137756348, 3.9131414890289307, 4.081567764282227, 4.249994277954102, 4.418420791625977, 4.586847305297852, 4.755273342132568, 4.923699855804443, 5.092126369476318, 5.260552406311035, 5.42897891998291, 5.597405433654785]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 2.0, 4.0, 7.0, 8.0, 11.0, 11.0, 16.0, 19.0, 25.0, 45.0, 65.0, 100.0, 117.0, 189.0, 286.0, 458.0, 745.0, 1236.0, 2125.0, 4062.0, 8860.0, 23143.0, 77170.0, 410671.0, 402437.0, 75388.0, 22773.0, 8931.0, 4200.0, 2113.0, 1178.0, 774.0, 473.0, 288.0, 199.0, 119.0, 93.0, 58.0, 45.0, 40.0, 24.0, 17.0, 9.0, 12.0, 7.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0], "bins": [-4.91015625, -4.77374267578125, -4.6373291015625, -4.50091552734375, -4.364501953125, -4.22808837890625, -4.0916748046875, -3.95526123046875, -3.81884765625, -3.68243408203125, -3.5460205078125, -3.40960693359375, -3.273193359375, -3.13677978515625, -3.0003662109375, -2.86395263671875, -2.7275390625, -2.59112548828125, -2.4547119140625, -2.31829833984375, -2.181884765625, -2.04547119140625, -1.9090576171875, -1.77264404296875, -1.63623046875, -1.49981689453125, -1.3634033203125, -1.22698974609375, -1.090576171875, -0.95416259765625, -0.8177490234375, -0.68133544921875, -0.544921875, -0.40850830078125, -0.2720947265625, -0.13568115234375, 0.000732421875, 0.13714599609375, 0.2735595703125, 0.40997314453125, 0.54638671875, 0.68280029296875, 0.8192138671875, 0.95562744140625, 1.092041015625, 1.22845458984375, 1.3648681640625, 1.50128173828125, 1.6376953125, 1.77410888671875, 1.9105224609375, 2.04693603515625, 2.183349609375, 2.31976318359375, 2.4561767578125, 2.59259033203125, 2.72900390625, 2.86541748046875, 3.0018310546875, 3.13824462890625, 3.274658203125, 3.41107177734375, 3.5474853515625, 3.68389892578125, 3.8203125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 2.0, 2.0, 3.0, 7.0, 12.0, 3.0, 12.0, 19.0, 12.0, 18.0, 35.0, 52.0, 56.0, 84.0, 83.0, 103.0, 119.0, 83.0, 72.0, 56.0, 50.0, 36.0, 18.0, 15.0, 17.0, 7.0, 6.0, 2.0, 5.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.537109375, -2.459625244140625, -2.38214111328125, -2.304656982421875, -2.2271728515625, -2.149688720703125, -2.07220458984375, -1.994720458984375, -1.917236328125, -1.839752197265625, -1.76226806640625, -1.684783935546875, -1.6072998046875, -1.529815673828125, -1.45233154296875, -1.374847412109375, -1.29736328125, -1.219879150390625, -1.14239501953125, -1.064910888671875, -0.9874267578125, -0.909942626953125, -0.83245849609375, -0.754974365234375, -0.677490234375, -0.600006103515625, -0.52252197265625, -0.445037841796875, -0.3675537109375, -0.290069580078125, -0.21258544921875, -0.135101318359375, -0.0576171875, 0.019866943359375, 0.09735107421875, 0.174835205078125, 0.2523193359375, 0.329803466796875, 0.40728759765625, 0.484771728515625, 0.562255859375, 0.639739990234375, 0.71722412109375, 0.794708251953125, 0.8721923828125, 0.949676513671875, 1.02716064453125, 1.104644775390625, 1.18212890625, 1.259613037109375, 1.33709716796875, 1.414581298828125, 1.4920654296875, 1.569549560546875, 1.64703369140625, 1.724517822265625, 1.802001953125, 1.879486083984375, 1.95697021484375, 2.034454345703125, 2.1119384765625, 2.189422607421875, 2.26690673828125, 2.344390869140625, 2.421875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 6.0, 6.0, 9.0, 8.0, 16.0, 18.0, 23.0, 47.0, 71.0, 103.0, 204.0, 289.0, 612.0, 1439.0, 4029.0, 14423.0, 80200.0, 713534.0, 196831.0, 26291.0, 6315.0, 2150.0, 893.0, 439.0, 246.0, 123.0, 88.0, 40.0, 44.0, 18.0, 18.0, 12.0, 6.0, 6.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.90625, -6.6737060546875, -6.441162109375, -6.2086181640625, -5.97607421875, -5.7435302734375, -5.510986328125, -5.2784423828125, -5.0458984375, -4.8133544921875, -4.580810546875, -4.3482666015625, -4.11572265625, -3.8831787109375, -3.650634765625, -3.4180908203125, -3.185546875, -2.9530029296875, -2.720458984375, -2.4879150390625, -2.25537109375, -2.0228271484375, -1.790283203125, -1.5577392578125, -1.3251953125, -1.0926513671875, -0.860107421875, -0.6275634765625, -0.39501953125, -0.1624755859375, 0.070068359375, 0.3026123046875, 0.53515625, 0.7677001953125, 1.000244140625, 1.2327880859375, 1.46533203125, 1.6978759765625, 1.930419921875, 2.1629638671875, 2.3955078125, 2.6280517578125, 2.860595703125, 3.0931396484375, 3.32568359375, 3.5582275390625, 3.790771484375, 4.0233154296875, 4.255859375, 4.4884033203125, 4.720947265625, 4.9534912109375, 5.18603515625, 5.4185791015625, 5.651123046875, 5.8836669921875, 6.1162109375, 6.3487548828125, 6.581298828125, 6.8138427734375, 7.04638671875, 7.2789306640625, 7.511474609375, 7.7440185546875, 7.9765625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 7.0, 5.0, 6.0, 7.0, 9.0, 15.0, 13.0, 22.0, 23.0, 27.0, 27.0, 37.0, 27.0, 47.0, 43.0, 53.0, 53.0, 58.0, 62.0, 48.0, 47.0, 49.0, 50.0, 45.0, 33.0, 41.0, 36.0, 26.0, 20.0, 17.0, 12.0, 8.0, 8.0, 6.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1171875, -8.8265380859375, -8.535888671875, -8.2452392578125, -7.95458984375, -7.6639404296875, -7.373291015625, -7.0826416015625, -6.7919921875, -6.5013427734375, -6.210693359375, -5.9200439453125, -5.62939453125, -5.3387451171875, -5.048095703125, -4.7574462890625, -4.466796875, -4.1761474609375, -3.885498046875, -3.5948486328125, -3.30419921875, -3.0135498046875, -2.722900390625, -2.4322509765625, -2.1416015625, -1.8509521484375, -1.560302734375, -1.2696533203125, -0.97900390625, -0.6883544921875, -0.397705078125, -0.1070556640625, 0.18359375, 0.4742431640625, 0.764892578125, 1.0555419921875, 1.34619140625, 1.6368408203125, 1.927490234375, 2.2181396484375, 2.5087890625, 2.7994384765625, 3.090087890625, 3.3807373046875, 3.67138671875, 3.9620361328125, 4.252685546875, 4.5433349609375, 4.833984375, 5.1246337890625, 5.415283203125, 5.7059326171875, 5.99658203125, 6.2872314453125, 6.577880859375, 6.8685302734375, 7.1591796875, 7.4498291015625, 7.740478515625, 8.0311279296875, 8.32177734375, 8.6124267578125, 8.903076171875, 9.1937255859375, 9.484375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 8.0, 9.0, 20.0, 36.0, 35.0, 66.0, 147.0, 345.0, 2151.0, 138741.0, 901422.0, 4703.0, 482.0, 160.0, 89.0, 51.0, 33.0, 18.0, 10.0, 8.0, 6.0, 5.0, 2.0, 8.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3828125, -12.0401611328125, -11.697509765625, -11.3548583984375, -11.01220703125, -10.6695556640625, -10.326904296875, -9.9842529296875, -9.6416015625, -9.2989501953125, -8.956298828125, -8.6136474609375, -8.27099609375, -7.9283447265625, -7.585693359375, -7.2430419921875, -6.900390625, -6.5577392578125, -6.215087890625, -5.8724365234375, -5.52978515625, -5.1871337890625, -4.844482421875, -4.5018310546875, -4.1591796875, -3.8165283203125, -3.473876953125, -3.1312255859375, -2.78857421875, -2.4459228515625, -2.103271484375, -1.7606201171875, -1.41796875, -1.0753173828125, -0.732666015625, -0.3900146484375, -0.04736328125, 0.2952880859375, 0.637939453125, 0.9805908203125, 1.3232421875, 1.6658935546875, 2.008544921875, 2.3511962890625, 2.69384765625, 3.0364990234375, 3.379150390625, 3.7218017578125, 4.064453125, 4.4071044921875, 4.749755859375, 5.0924072265625, 5.43505859375, 5.7777099609375, 6.120361328125, 6.4630126953125, 6.8056640625, 7.1483154296875, 7.490966796875, 7.8336181640625, 8.17626953125, 8.5189208984375, 8.861572265625, 9.2042236328125, 9.546875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 11.0, 13.0, 35.0, 60.0, 174.0, 279.0, 238.0, 95.0, 48.0, 29.0, 12.0, 9.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003571510314941406, -0.0003290101885795593, -0.00030086934566497803, -0.00027272850275039673, -0.00024458765983581543, -0.00021644681692123413, -0.00018830597400665283, -0.00016016513109207153, -0.00013202428817749023, -0.00010388344526290894, -7.574260234832764e-05, -4.760175943374634e-05, -1.946091651916504e-05, 8.67992639541626e-06, 3.682076930999756e-05, 6.496161222457886e-05, 9.310245513916016e-05, 0.00012124329805374146, 0.00014938414096832275, 0.00017752498388290405, 0.00020566582679748535, 0.00023380666971206665, 0.00026194751262664795, 0.00029008835554122925, 0.00031822919845581055, 0.00034637004137039185, 0.00037451088428497314, 0.00040265172719955444, 0.00043079257011413574, 0.00045893341302871704, 0.00048707425594329834, 0.0005152150988578796, 0.0005433559417724609, 0.0005714967846870422, 0.0005996376276016235, 0.0006277784705162048, 0.0006559193134307861, 0.0006840601563453674, 0.0007122009992599487, 0.00074034184217453, 0.0007684826850891113, 0.0007966235280036926, 0.0008247643709182739, 0.0008529052138328552, 0.0008810460567474365, 0.0009091868996620178, 0.0009373277425765991, 0.0009654685854911804, 0.0009936094284057617, 0.001021750271320343, 0.0010498911142349243, 0.0010780319571495056, 0.001106172800064087, 0.0011343136429786682, 0.0011624544858932495, 0.0011905953288078308, 0.0012187361717224121, 0.0012468770146369934, 0.0012750178575515747, 0.001303158700466156, 0.0013312995433807373, 0.0013594403862953186, 0.0013875812292099, 0.0014157220721244812, 0.0014438629150390625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 15.0, 6.0, 10.0, 24.0, 40.0, 73.0, 156.0, 350.0, 952.0, 3859.0, 32671.0, 845179.0, 152809.0, 9679.0, 1720.0, 551.0, 220.0, 95.0, 65.0, 27.0, 20.0, 14.0, 7.0, 8.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.90625, -5.749755859375, -5.59326171875, -5.436767578125, -5.2802734375, -5.123779296875, -4.96728515625, -4.810791015625, -4.654296875, -4.497802734375, -4.34130859375, -4.184814453125, -4.0283203125, -3.871826171875, -3.71533203125, -3.558837890625, -3.40234375, -3.245849609375, -3.08935546875, -2.932861328125, -2.7763671875, -2.619873046875, -2.46337890625, -2.306884765625, -2.150390625, -1.993896484375, -1.83740234375, -1.680908203125, -1.5244140625, -1.367919921875, -1.21142578125, -1.054931640625, -0.8984375, -0.741943359375, -0.58544921875, -0.428955078125, -0.2724609375, -0.115966796875, 0.04052734375, 0.197021484375, 0.353515625, 0.510009765625, 0.66650390625, 0.822998046875, 0.9794921875, 1.135986328125, 1.29248046875, 1.448974609375, 1.60546875, 1.761962890625, 1.91845703125, 2.074951171875, 2.2314453125, 2.387939453125, 2.54443359375, 2.700927734375, 2.857421875, 3.013916015625, 3.17041015625, 3.326904296875, 3.4833984375, 3.639892578125, 3.79638671875, 3.952880859375, 4.109375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 2.0, 8.0, 6.0, 9.0, 16.0, 22.0, 34.0, 35.0, 55.0, 86.0, 107.0, 139.0, 141.0, 105.0, 52.0, 53.0, 37.0, 33.0, 19.0, 11.0, 15.0, 4.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.912109375, -3.799957275390625, -3.68780517578125, -3.575653076171875, -3.4635009765625, -3.351348876953125, -3.23919677734375, -3.127044677734375, -3.014892578125, -2.902740478515625, -2.79058837890625, -2.678436279296875, -2.5662841796875, -2.454132080078125, -2.34197998046875, -2.229827880859375, -2.11767578125, -2.005523681640625, -1.89337158203125, -1.781219482421875, -1.6690673828125, -1.556915283203125, -1.44476318359375, -1.332611083984375, -1.220458984375, -1.108306884765625, -0.99615478515625, -0.884002685546875, -0.7718505859375, -0.659698486328125, -0.54754638671875, -0.435394287109375, -0.3232421875, -0.211090087890625, -0.09893798828125, 0.013214111328125, 0.1253662109375, 0.237518310546875, 0.34967041015625, 0.461822509765625, 0.573974609375, 0.686126708984375, 0.79827880859375, 0.910430908203125, 1.0225830078125, 1.134735107421875, 1.24688720703125, 1.359039306640625, 1.47119140625, 1.583343505859375, 1.69549560546875, 1.807647705078125, 1.9197998046875, 2.031951904296875, 2.14410400390625, 2.256256103515625, 2.368408203125, 2.480560302734375, 2.59271240234375, 2.704864501953125, 2.8170166015625, 2.929168701171875, 3.04132080078125, 3.153472900390625, 3.265625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 15.0, 19.0, 12.0, 38.0, 71.0, 120.0, 160.0, 162.0, 166.0, 107.0, 47.0, 37.0, 20.0, 11.0, 4.0, 3.0, 8.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-84.06126403808594, -82.25242614746094, -80.44358825683594, -78.63475036621094, -76.82591247558594, -75.01707458496094, -73.20823669433594, -71.39939880371094, -69.59056091308594, -67.78172302246094, -65.97288513183594, -64.16404724121094, -62.35520935058594, -60.54637145996094, -58.73753356933594, -56.92869567871094, -55.1198616027832, -53.3110237121582, -51.5021858215332, -49.6933479309082, -47.8845100402832, -46.0756721496582, -44.26683807373047, -42.45800018310547, -40.64916229248047, -38.84032440185547, -37.03148651123047, -35.22264862060547, -33.41381072998047, -31.60497283935547, -29.7961368560791, -27.9872989654541, -26.17845916748047, -24.36962127685547, -22.56078338623047, -20.75194549560547, -18.94310760498047, -17.13426971435547, -15.325433731079102, -13.516595840454102, -11.707757949829102, -9.898920059204102, -8.090082168579102, -6.281245231628418, -4.472407341003418, -2.663569450378418, -0.8547325134277344, 0.9541053771972656, 2.7629432678222656, 4.571781158447266, 6.380618572235107, 8.18945598602295, 9.99829387664795, 11.80713176727295, 13.615968704223633, 15.424806594848633, 17.233644485473633, 19.042482376098633, 20.851320266723633, 22.66015625, 24.468994140625, 26.27783203125, 28.086669921875, 29.8955078125, 31.704345703125]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 5.0, 6.0, 15.0, 20.0, 21.0, 18.0, 22.0, 35.0, 41.0, 55.0, 66.0, 65.0, 66.0, 82.0, 91.0, 59.0, 55.0, 65.0, 44.0, 36.0, 26.0, 31.0, 19.0, 15.0, 13.0, 11.0, 12.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.64944839477539, -61.10551071166992, -59.56157302856445, -58.017635345458984, -56.473697662353516, -54.92975616455078, -53.38581848144531, -51.841880798339844, -50.297943115234375, -48.754005432128906, -47.21006774902344, -45.66613006591797, -44.1221923828125, -42.57825469970703, -41.03431701660156, -39.49037551879883, -37.946441650390625, -36.402503967285156, -34.85856628417969, -33.31462860107422, -31.770689010620117, -30.22675132751465, -28.68281364440918, -27.138874053955078, -25.59493637084961, -24.05099868774414, -22.507061004638672, -20.963123321533203, -19.4191837310791, -17.875246047973633, -16.331308364868164, -14.787369728088379, -13.243431091308594, -11.699493408203125, -10.15555477142334, -8.611617088317871, -7.067678928375244, -5.523740768432617, -3.9798030853271484, -2.4358644485473633, -0.8919267654418945, 0.6520112752914429, 2.1959493160247803, 3.739887237548828, 5.283825397491455, 6.827763557434082, 8.37170124053955, 9.915639877319336, 11.459577560424805, 13.003515243530273, 14.547453880310059, 16.091392517089844, 17.635330200195312, 19.17926788330078, 20.72320556640625, 22.26714324951172, 23.811080932617188, 25.355018615722656, 26.898956298828125, 28.442893981933594, 29.986833572387695, 31.530771255493164, 33.07470703125, 34.618648529052734, 36.1625862121582]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 8.0, 3.0, 4.0, 6.0, 8.0, 8.0, 7.0, 17.0, 18.0, 25.0, 38.0, 63.0, 93.0, 151.0, 254.0, 493.0, 1264.0, 4178.0, 237030.0, 3943385.0, 4932.0, 1275.0, 484.0, 230.0, 128.0, 63.0, 48.0, 28.0, 14.0, 11.0, 2.0, 9.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-25.84375, -25.2696533203125, -24.695556640625, -24.1214599609375, -23.54736328125, -22.9732666015625, -22.399169921875, -21.8250732421875, -21.2509765625, -20.6768798828125, -20.102783203125, -19.5286865234375, -18.95458984375, -18.3804931640625, -17.806396484375, -17.2322998046875, -16.658203125, -16.0841064453125, -15.510009765625, -14.9359130859375, -14.36181640625, -13.7877197265625, -13.213623046875, -12.6395263671875, -12.0654296875, -11.4913330078125, -10.917236328125, -10.3431396484375, -9.76904296875, -9.1949462890625, -8.620849609375, -8.0467529296875, -7.47265625, -6.8985595703125, -6.324462890625, -5.7503662109375, -5.17626953125, -4.6021728515625, -4.028076171875, -3.4539794921875, -2.8798828125, -2.3057861328125, -1.731689453125, -1.1575927734375, -0.58349609375, -0.0093994140625, 0.564697265625, 1.1387939453125, 1.712890625, 2.2869873046875, 2.861083984375, 3.4351806640625, 4.00927734375, 4.5833740234375, 5.157470703125, 5.7315673828125, 6.3056640625, 6.8797607421875, 7.453857421875, 8.0279541015625, 8.60205078125, 9.1761474609375, 9.750244140625, 10.3243408203125, 10.8984375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 9.0, 14.0, 13.0, 18.0, 42.0, 97.0, 133.0, 206.0, 184.0, 129.0, 69.0, 36.0, 16.0, 12.0, 8.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.5625, -6.41204833984375, -6.2615966796875, -6.11114501953125, -5.960693359375, -5.81024169921875, -5.6597900390625, -5.50933837890625, -5.35888671875, -5.20843505859375, -5.0579833984375, -4.90753173828125, -4.757080078125, -4.60662841796875, -4.4561767578125, -4.30572509765625, -4.1552734375, -4.00482177734375, -3.8543701171875, -3.70391845703125, -3.553466796875, -3.40301513671875, -3.2525634765625, -3.10211181640625, -2.95166015625, -2.80120849609375, -2.6507568359375, -2.50030517578125, -2.349853515625, -2.19940185546875, -2.0489501953125, -1.89849853515625, -1.748046875, -1.59759521484375, -1.4471435546875, -1.29669189453125, -1.146240234375, -0.99578857421875, -0.8453369140625, -0.69488525390625, -0.54443359375, -0.39398193359375, -0.2435302734375, -0.09307861328125, 0.057373046875, 0.20782470703125, 0.3582763671875, 0.50872802734375, 0.6591796875, 0.80963134765625, 0.9600830078125, 1.11053466796875, 1.260986328125, 1.41143798828125, 1.5618896484375, 1.71234130859375, 1.86279296875, 2.01324462890625, 2.1636962890625, 2.31414794921875, 2.464599609375, 2.61505126953125, 2.7655029296875, 2.91595458984375, 3.06640625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 6.0, 4.0, 13.0, 12.0, 17.0, 22.0, 35.0, 25.0, 25.0, 39.0, 67.0, 95.0, 101.0, 127.0, 171.0, 275.0, 404.0, 587.0, 910.0, 1547.0, 2523.0, 4651.0, 9694.0, 34678.0, 4063449.0, 50742.0, 11156.0, 5144.0, 2781.0, 1749.0, 1058.0, 633.0, 430.0, 339.0, 195.0, 128.0, 112.0, 87.0, 74.0, 51.0, 26.0, 24.0, 17.0, 18.0, 9.0, 10.0, 7.0, 6.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0], "bins": [-8.5234375, -8.2447509765625, -7.966064453125, -7.6873779296875, -7.40869140625, -7.1300048828125, -6.851318359375, -6.5726318359375, -6.2939453125, -6.0152587890625, -5.736572265625, -5.4578857421875, -5.17919921875, -4.9005126953125, -4.621826171875, -4.3431396484375, -4.064453125, -3.7857666015625, -3.507080078125, -3.2283935546875, -2.94970703125, -2.6710205078125, -2.392333984375, -2.1136474609375, -1.8349609375, -1.5562744140625, -1.277587890625, -0.9989013671875, -0.72021484375, -0.4415283203125, -0.162841796875, 0.1158447265625, 0.39453125, 0.6732177734375, 0.951904296875, 1.2305908203125, 1.50927734375, 1.7879638671875, 2.066650390625, 2.3453369140625, 2.6240234375, 2.9027099609375, 3.181396484375, 3.4600830078125, 3.73876953125, 4.0174560546875, 4.296142578125, 4.5748291015625, 4.853515625, 5.1322021484375, 5.410888671875, 5.6895751953125, 5.96826171875, 6.2469482421875, 6.525634765625, 6.8043212890625, 7.0830078125, 7.3616943359375, 7.640380859375, 7.9190673828125, 8.19775390625, 8.4764404296875, 8.755126953125, 9.0338134765625, 9.3125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 3.0, 6.0, 6.0, 10.0, 16.0, 34.0, 168.0, 3671.0, 68.0, 36.0, 15.0, 11.0, 3.0, 2.0, 3.0, 1.0, 3.0, 4.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.125, -4.96649169921875, -4.8079833984375, -4.64947509765625, -4.490966796875, -4.33245849609375, -4.1739501953125, -4.01544189453125, -3.85693359375, -3.69842529296875, -3.5399169921875, -3.38140869140625, -3.222900390625, -3.06439208984375, -2.9058837890625, -2.74737548828125, -2.5888671875, -2.43035888671875, -2.2718505859375, -2.11334228515625, -1.954833984375, -1.79632568359375, -1.6378173828125, -1.47930908203125, -1.32080078125, -1.16229248046875, -1.0037841796875, -0.84527587890625, -0.686767578125, -0.52825927734375, -0.3697509765625, -0.21124267578125, -0.052734375, 0.10577392578125, 0.2642822265625, 0.42279052734375, 0.581298828125, 0.73980712890625, 0.8983154296875, 1.05682373046875, 1.21533203125, 1.37384033203125, 1.5323486328125, 1.69085693359375, 1.849365234375, 2.00787353515625, 2.1663818359375, 2.32489013671875, 2.4833984375, 2.64190673828125, 2.8004150390625, 2.95892333984375, 3.117431640625, 3.27593994140625, 3.4344482421875, 3.59295654296875, 3.75146484375, 3.90997314453125, 4.0684814453125, 4.22698974609375, 4.385498046875, 4.54400634765625, 4.7025146484375, 4.86102294921875, 5.01953125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 7.0, 4.0, 2.0, 6.0, 3.0, 3.0, 7.0, 9.0, 6.0, 10.0, 12.0, 19.0, 17.0, 27.0, 35.0, 47.0, 64.0, 78.0, 91.0, 96.0, 74.0, 72.0, 63.0, 62.0, 40.0, 30.0, 18.0, 12.0, 13.0, 20.0, 15.0, 11.0, 10.0, 7.0, 4.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.592257499694824, -9.307798385620117, -9.023338317871094, -8.738879203796387, -8.454419136047363, -8.169960021972656, -7.885500431060791, -7.601040840148926, -7.3165812492370605, -7.032121658325195, -6.74766206741333, -6.463202476501465, -6.178743362426758, -5.894283294677734, -5.609824180603027, -5.325364589691162, -5.040904998779297, -4.756445407867432, -4.471985816955566, -4.187526226043701, -3.903066873550415, -3.61860728263855, -3.3341479301452637, -3.0496883392333984, -2.765228748321533, -2.480769157409668, -2.1963095664978027, -1.9118502140045166, -1.6273906230926514, -1.3429310321807861, -1.0584715604782104, -0.7740120887756348, -0.48955345153808594, -0.20509392023086548, 0.07936561107635498, 0.36382514238357544, 0.6482846736907959, 0.9327442646026611, 1.2172037363052368, 1.5016632080078125, 1.7861227989196777, 2.070582389831543, 2.355041980743408, 2.6395013332366943, 2.9239609241485596, 3.208420515060425, 3.492879867553711, 3.777339458465576, 4.061799049377441, 4.346258640289307, 4.630718231201172, 4.915177822113037, 5.199637413024902, 5.484096527099609, 5.768556118011475, 6.05301570892334, 6.337475299835205, 6.62193489074707, 6.9063944816589355, 7.190854072570801, 7.475313186645508, 7.759773254394531, 8.044232368469238, 8.328691482543945, 8.613151550292969]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 3.0, 4.0, 3.0, 9.0, 9.0, 16.0, 10.0, 15.0, 27.0, 19.0, 24.0, 36.0, 39.0, 27.0, 46.0, 49.0, 40.0, 53.0, 56.0, 51.0, 58.0, 61.0, 48.0, 49.0, 36.0, 41.0, 34.0, 28.0, 29.0, 16.0, 14.0, 14.0, 12.0, 7.0, 7.0, 5.0, 2.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.650160789489746, -7.321600437164307, -6.993040084838867, -6.664480209350586, -6.3359198570251465, -6.007359504699707, -5.678799629211426, -5.350239276885986, -5.021678924560547, -4.693118572235107, -4.364558219909668, -4.035998344421387, -3.7074379920959473, -3.378877639770508, -3.0503175258636475, -2.721757411956787, -2.3931970596313477, -2.064636707305908, -1.7360765933990479, -1.407516360282898, -1.078956127166748, -0.7503958940505981, -0.42183566093444824, -0.09327554702758789, 0.23528480529785156, 0.5638450384140015, 0.8924052715301514, 1.2209655046463013, 1.5495257377624512, 1.878085970878601, 2.206646203994751, 2.5352063179016113, 2.863767623901367, 3.1923279762268066, 3.520888090133667, 3.8494482040405273, 4.178008556365967, 4.506568908691406, 4.8351287841796875, 5.163689136505127, 5.492249488830566, 5.820809841156006, 6.149370193481445, 6.477930068969727, 6.806490421295166, 7.1350507736206055, 7.463610649108887, 7.792171001434326, 8.120731353759766, 8.449291229248047, 8.777852058410645, 9.106411933898926, 9.434972763061523, 9.763532638549805, 10.092092514038086, 10.420652389526367, 10.749213218688965, 11.077773094177246, 11.406333923339844, 11.734893798828125, 12.063453674316406, 12.392014503479004, 12.720574378967285, 13.049135208129883, 13.377695083618164]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 5.0, 5.0, 16.0, 20.0, 24.0, 37.0, 75.0, 100.0, 141.0, 275.0, 440.0, 945.0, 2310.0, 6237.0, 24865.0, 175979.0, 716032.0, 96516.0, 16356.0, 4628.0, 1752.0, 782.0, 407.0, 226.0, 136.0, 83.0, 43.0, 31.0, 17.0, 23.0, 15.0, 7.0, 7.0, 7.0, 7.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.671875, -8.3765869140625, -8.081298828125, -7.7860107421875, -7.49072265625, -7.1954345703125, -6.900146484375, -6.6048583984375, -6.3095703125, -6.0142822265625, -5.718994140625, -5.4237060546875, -5.12841796875, -4.8331298828125, -4.537841796875, -4.2425537109375, -3.947265625, -3.6519775390625, -3.356689453125, -3.0614013671875, -2.76611328125, -2.4708251953125, -2.175537109375, -1.8802490234375, -1.5849609375, -1.2896728515625, -0.994384765625, -0.6990966796875, -0.40380859375, -0.1085205078125, 0.186767578125, 0.4820556640625, 0.77734375, 1.0726318359375, 1.367919921875, 1.6632080078125, 1.95849609375, 2.2537841796875, 2.549072265625, 2.8443603515625, 3.1396484375, 3.4349365234375, 3.730224609375, 4.0255126953125, 4.32080078125, 4.6160888671875, 4.911376953125, 5.2066650390625, 5.501953125, 5.7972412109375, 6.092529296875, 6.3878173828125, 6.68310546875, 6.9783935546875, 7.273681640625, 7.5689697265625, 7.8642578125, 8.1595458984375, 8.454833984375, 8.7501220703125, 9.04541015625, 9.3406982421875, 9.635986328125, 9.9312744140625, 10.2265625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 5.0, 1.0, 8.0, 9.0, 19.0, 9.0, 38.0, 52.0, 60.0, 95.0, 111.0, 133.0, 118.0, 106.0, 86.0, 57.0, 34.0, 18.0, 16.0, 10.0, 8.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.56640625, -4.453765869140625, -4.34112548828125, -4.228485107421875, -4.1158447265625, -4.003204345703125, -3.89056396484375, -3.777923583984375, -3.665283203125, -3.552642822265625, -3.44000244140625, -3.327362060546875, -3.2147216796875, -3.102081298828125, -2.98944091796875, -2.876800537109375, -2.76416015625, -2.651519775390625, -2.53887939453125, -2.426239013671875, -2.3135986328125, -2.200958251953125, -2.08831787109375, -1.975677490234375, -1.863037109375, -1.750396728515625, -1.63775634765625, -1.525115966796875, -1.4124755859375, -1.299835205078125, -1.18719482421875, -1.074554443359375, -0.9619140625, -0.849273681640625, -0.73663330078125, -0.623992919921875, -0.5113525390625, -0.398712158203125, -0.28607177734375, -0.173431396484375, -0.060791015625, 0.051849365234375, 0.16448974609375, 0.277130126953125, 0.3897705078125, 0.502410888671875, 0.61505126953125, 0.727691650390625, 0.84033203125, 0.952972412109375, 1.06561279296875, 1.178253173828125, 1.2908935546875, 1.403533935546875, 1.51617431640625, 1.628814697265625, 1.741455078125, 1.854095458984375, 1.96673583984375, 2.079376220703125, 2.1920166015625, 2.304656982421875, 2.41729736328125, 2.529937744140625, 2.642578125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 4.0, 2.0, 3.0, 14.0, 14.0, 22.0, 57.0, 64.0, 112.0, 188.0, 425.0, 971.0, 2596.0, 9127.0, 51313.0, 663415.0, 284894.0, 26185.0, 5811.0, 1858.0, 727.0, 312.0, 171.0, 110.0, 59.0, 25.0, 19.0, 23.0, 9.0, 8.0, 2.0, 5.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.2265625, -6.935546875, -6.64453125, -6.353515625, -6.0625, -5.771484375, -5.48046875, -5.189453125, -4.8984375, -4.607421875, -4.31640625, -4.025390625, -3.734375, -3.443359375, -3.15234375, -2.861328125, -2.5703125, -2.279296875, -1.98828125, -1.697265625, -1.40625, -1.115234375, -0.82421875, -0.533203125, -0.2421875, 0.048828125, 0.33984375, 0.630859375, 0.921875, 1.212890625, 1.50390625, 1.794921875, 2.0859375, 2.376953125, 2.66796875, 2.958984375, 3.25, 3.541015625, 3.83203125, 4.123046875, 4.4140625, 4.705078125, 4.99609375, 5.287109375, 5.578125, 5.869140625, 6.16015625, 6.451171875, 6.7421875, 7.033203125, 7.32421875, 7.615234375, 7.90625, 8.197265625, 8.48828125, 8.779296875, 9.0703125, 9.361328125, 9.65234375, 9.943359375, 10.234375, 10.525390625, 10.81640625, 11.107421875, 11.3984375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 7.0, 3.0, 5.0, 8.0, 6.0, 6.0, 14.0, 12.0, 13.0, 20.0, 24.0, 23.0, 29.0, 39.0, 51.0, 39.0, 53.0, 50.0, 52.0, 52.0, 49.0, 49.0, 37.0, 53.0, 48.0, 41.0, 49.0, 39.0, 18.0, 19.0, 15.0, 20.0, 9.0, 10.0, 6.0, 11.0, 8.0, 3.0, 5.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.9140625, -7.65771484375, -7.4013671875, -7.14501953125, -6.888671875, -6.63232421875, -6.3759765625, -6.11962890625, -5.86328125, -5.60693359375, -5.3505859375, -5.09423828125, -4.837890625, -4.58154296875, -4.3251953125, -4.06884765625, -3.8125, -3.55615234375, -3.2998046875, -3.04345703125, -2.787109375, -2.53076171875, -2.2744140625, -2.01806640625, -1.76171875, -1.50537109375, -1.2490234375, -0.99267578125, -0.736328125, -0.47998046875, -0.2236328125, 0.03271484375, 0.2890625, 0.54541015625, 0.8017578125, 1.05810546875, 1.314453125, 1.57080078125, 1.8271484375, 2.08349609375, 2.33984375, 2.59619140625, 2.8525390625, 3.10888671875, 3.365234375, 3.62158203125, 3.8779296875, 4.13427734375, 4.390625, 4.64697265625, 4.9033203125, 5.15966796875, 5.416015625, 5.67236328125, 5.9287109375, 6.18505859375, 6.44140625, 6.69775390625, 6.9541015625, 7.21044921875, 7.466796875, 7.72314453125, 7.9794921875, 8.23583984375, 8.4921875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 6.0, 9.0, 6.0, 17.0, 38.0, 53.0, 113.0, 262.0, 679.0, 2848.0, 35391.0, 948779.0, 55400.0, 3633.0, 781.0, 257.0, 132.0, 65.0, 39.0, 19.0, 9.0, 7.0, 5.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.388671875, -3.215423583984375, -3.04217529296875, -2.868927001953125, -2.6956787109375, -2.522430419921875, -2.34918212890625, -2.175933837890625, -2.002685546875, -1.829437255859375, -1.65618896484375, -1.482940673828125, -1.3096923828125, -1.136444091796875, -0.96319580078125, -0.789947509765625, -0.61669921875, -0.443450927734375, -0.27020263671875, -0.096954345703125, 0.0762939453125, 0.249542236328125, 0.42279052734375, 0.596038818359375, 0.769287109375, 0.942535400390625, 1.11578369140625, 1.289031982421875, 1.4622802734375, 1.635528564453125, 1.80877685546875, 1.982025146484375, 2.1552734375, 2.328521728515625, 2.50177001953125, 2.675018310546875, 2.8482666015625, 3.021514892578125, 3.19476318359375, 3.368011474609375, 3.541259765625, 3.714508056640625, 3.88775634765625, 4.061004638671875, 4.2342529296875, 4.407501220703125, 4.58074951171875, 4.753997802734375, 4.92724609375, 5.100494384765625, 5.27374267578125, 5.446990966796875, 5.6202392578125, 5.793487548828125, 5.96673583984375, 6.139984130859375, 6.313232421875, 6.486480712890625, 6.65972900390625, 6.832977294921875, 7.0062255859375, 7.179473876953125, 7.35272216796875, 7.525970458984375, 7.69921875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 8.0, 5.0, 5.0, 10.0, 19.0, 27.0, 38.0, 72.0, 107.0, 168.0, 171.0, 153.0, 93.0, 50.0, 24.0, 25.0, 15.0, 11.0, 6.0, 5.0, 3.0, 2.0, 1.0], "bins": [-0.0009245872497558594, -0.0009065326303243637, -0.000888478010892868, -0.0008704233914613724, -0.0008523687720298767, -0.000834314152598381, -0.0008162595331668854, -0.0007982049137353897, -0.000780150294303894, -0.0007620956748723984, -0.0007440410554409027, -0.000725986436009407, -0.0007079318165779114, -0.0006898771971464157, -0.00067182257771492, -0.0006537679582834244, -0.0006357133388519287, -0.000617658719420433, -0.0005996040999889374, -0.0005815494805574417, -0.000563494861125946, -0.0005454402416944504, -0.0005273856222629547, -0.000509331002831459, -0.0004912763833999634, -0.0004732217639684677, -0.00045516714453697205, -0.0004371125251054764, -0.0004190579056739807, -0.00040100328624248505, -0.0003829486668109894, -0.0003648940473794937, -0.00034683942794799805, -0.0003287848085165024, -0.0003107301890850067, -0.00029267556965351105, -0.0002746209502220154, -0.0002565663307905197, -0.00023851171135902405, -0.00022045709192752838, -0.00020240247249603271, -0.00018434785306453705, -0.00016629323363304138, -0.00014823861420154572, -0.00013018399477005005, -0.00011212937533855438, -9.407475590705872e-05, -7.602013647556305e-05, -5.796551704406738e-05, -3.9910897612571716e-05, -2.185627818107605e-05, -3.8016587495803833e-06, 1.4252960681915283e-05, 3.230758011341095e-05, 5.0362199544906616e-05, 6.841681897640228e-05, 8.647143840789795e-05, 0.00010452605783939362, 0.00012258067727088928, 0.00014063529670238495, 0.00015868991613388062, 0.00017674453556537628, 0.00019479915499687195, 0.00021285377442836761, 0.00023090839385986328]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 4.0, 7.0, 5.0, 11.0, 13.0, 18.0, 49.0, 85.0, 151.0, 281.0, 660.0, 1852.0, 10784.0, 400015.0, 617954.0, 13158.0, 2134.0, 703.0, 286.0, 163.0, 88.0, 50.0, 32.0, 19.0, 13.0, 6.0, 3.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.26171875, -4.09808349609375, -3.9344482421875, -3.77081298828125, -3.607177734375, -3.44354248046875, -3.2799072265625, -3.11627197265625, -2.95263671875, -2.78900146484375, -2.6253662109375, -2.46173095703125, -2.298095703125, -2.13446044921875, -1.9708251953125, -1.80718994140625, -1.6435546875, -1.47991943359375, -1.3162841796875, -1.15264892578125, -0.989013671875, -0.82537841796875, -0.6617431640625, -0.49810791015625, -0.33447265625, -0.17083740234375, -0.0072021484375, 0.15643310546875, 0.320068359375, 0.48370361328125, 0.6473388671875, 0.81097412109375, 0.974609375, 1.13824462890625, 1.3018798828125, 1.46551513671875, 1.629150390625, 1.79278564453125, 1.9564208984375, 2.12005615234375, 2.28369140625, 2.44732666015625, 2.6109619140625, 2.77459716796875, 2.938232421875, 3.10186767578125, 3.2655029296875, 3.42913818359375, 3.5927734375, 3.75640869140625, 3.9200439453125, 4.08367919921875, 4.247314453125, 4.41094970703125, 4.5745849609375, 4.73822021484375, 4.90185546875, 5.06549072265625, 5.2291259765625, 5.39276123046875, 5.556396484375, 5.72003173828125, 5.8836669921875, 6.04730224609375, 6.2109375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 6.0, 11.0, 29.0, 44.0, 82.0, 143.0, 202.0, 192.0, 144.0, 70.0, 37.0, 20.0, 13.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.26171875, -4.08319091796875, -3.9046630859375, -3.72613525390625, -3.547607421875, -3.36907958984375, -3.1905517578125, -3.01202392578125, -2.83349609375, -2.65496826171875, -2.4764404296875, -2.29791259765625, -2.119384765625, -1.94085693359375, -1.7623291015625, -1.58380126953125, -1.4052734375, -1.22674560546875, -1.0482177734375, -0.86968994140625, -0.691162109375, -0.51263427734375, -0.3341064453125, -0.15557861328125, 0.02294921875, 0.20147705078125, 0.3800048828125, 0.55853271484375, 0.737060546875, 0.91558837890625, 1.0941162109375, 1.27264404296875, 1.451171875, 1.62969970703125, 1.8082275390625, 1.98675537109375, 2.165283203125, 2.34381103515625, 2.5223388671875, 2.70086669921875, 2.87939453125, 3.05792236328125, 3.2364501953125, 3.41497802734375, 3.593505859375, 3.77203369140625, 3.9505615234375, 4.12908935546875, 4.3076171875, 4.48614501953125, 4.6646728515625, 4.84320068359375, 5.021728515625, 5.20025634765625, 5.3787841796875, 5.55731201171875, 5.73583984375, 5.91436767578125, 6.0928955078125, 6.27142333984375, 6.449951171875, 6.62847900390625, 6.8070068359375, 6.98553466796875, 7.1640625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 6.0, 6.0, 19.0, 33.0, 92.0, 135.0, 223.0, 223.0, 137.0, 63.0, 30.0, 20.0, 13.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.38458251953125, -88.84367370605469, -86.30276489257812, -83.76185607910156, -81.220947265625, -78.68003845214844, -76.13912963867188, -73.59822082519531, -71.05731201171875, -68.51640319824219, -65.97549438476562, -63.43458557128906, -60.8936767578125, -58.35276794433594, -55.81186294555664, -53.27095413208008, -50.73004913330078, -48.18914031982422, -45.648231506347656, -43.107322692871094, -40.56641387939453, -38.02550506591797, -35.48460006713867, -32.94369125366211, -30.402782440185547, -27.861873626708984, -25.320964813232422, -22.780057907104492, -20.23914909362793, -17.698240280151367, -15.157332420349121, -12.616424560546875, -10.075515747070312, -7.534607410430908, -4.993699073791504, -2.4527907371520996, 0.08811759948730469, 2.629026412963867, 5.169934272766113, 7.710842132568359, 10.251750946044922, 12.792659759521484, 15.33356761932373, 17.874475479125977, 20.41538429260254, 22.9562931060791, 25.49720001220703, 28.038108825683594, 30.579017639160156, 33.11992645263672, 35.66083526611328, 38.201744079589844, 40.742652893066406, 43.28356170654297, 45.824466705322266, 48.36537551879883, 50.90628433227539, 53.44719314575195, 55.988101959228516, 58.52901077270508, 61.069915771484375, 63.61082458496094, 66.1517333984375, 68.69264221191406, 71.23355102539062]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 10.0, 9.0, 9.0, 13.0, 9.0, 19.0, 21.0, 29.0, 22.0, 47.0, 30.0, 42.0, 35.0, 41.0, 60.0, 46.0, 64.0, 50.0, 56.0, 48.0, 40.0, 40.0, 36.0, 36.0, 27.0, 26.0, 22.0, 24.0, 16.0, 10.0, 10.0, 8.0, 9.0, 9.0, 3.0, 4.0, 6.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-33.66944885253906, -32.45766830444336, -31.245887756347656, -30.034107208251953, -28.82232666015625, -27.610546112060547, -26.398767471313477, -25.186986923217773, -23.97520637512207, -22.763425827026367, -21.551645278930664, -20.33986473083496, -19.12808609008789, -17.916305541992188, -16.704524993896484, -15.492744445800781, -14.280963897705078, -13.069183349609375, -11.857402801513672, -10.645623207092285, -9.433842658996582, -8.222062110900879, -7.010282039642334, -5.798501968383789, -4.586721420288086, -3.374941110610962, -2.163160800933838, -0.9513804912567139, 0.26039981842041016, 1.4721803665161133, 2.683960437774658, 3.895740509033203, 5.107517242431641, 6.319297790527344, 7.531077861785889, 8.742857933044434, 9.954638481140137, 11.16641902923584, 12.378198623657227, 13.58997917175293, 14.801759719848633, 16.013540267944336, 17.22532081604004, 18.437101364135742, 19.648880004882812, 20.860660552978516, 22.07244110107422, 23.284221649169922, 24.496002197265625, 25.707782745361328, 26.91956329345703, 28.131343841552734, 29.343124389648438, 30.55490493774414, 31.76668357849121, 32.97846221923828, 34.19024658203125, 35.40202713012695, 36.613807678222656, 37.82558822631836, 39.03736877441406, 40.249149322509766, 41.46092987060547, 42.672706604003906, 43.88448715209961]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 4.0, 3.0, 3.0, 3.0, 8.0, 10.0, 8.0, 20.0, 25.0, 33.0, 52.0, 64.0, 108.0, 139.0, 211.0, 321.0, 476.0, 753.0, 1224.0, 2244.0, 3945.0, 7834.0, 17937.0, 54871.0, 661695.0, 3295261.0, 98078.0, 26706.0, 10828.0, 5038.0, 2603.0, 1479.0, 854.0, 525.0, 298.0, 221.0, 156.0, 74.0, 51.0, 53.0, 20.0, 14.0, 14.0, 8.0, 8.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.99609375, -3.871917724609375, -3.74774169921875, -3.623565673828125, -3.4993896484375, -3.375213623046875, -3.25103759765625, -3.126861572265625, -3.002685546875, -2.878509521484375, -2.75433349609375, -2.630157470703125, -2.5059814453125, -2.381805419921875, -2.25762939453125, -2.133453369140625, -2.00927734375, -1.885101318359375, -1.76092529296875, -1.636749267578125, -1.5125732421875, -1.388397216796875, -1.26422119140625, -1.140045166015625, -1.015869140625, -0.891693115234375, -0.76751708984375, -0.643341064453125, -0.5191650390625, -0.394989013671875, -0.27081298828125, -0.146636962890625, -0.0224609375, 0.101715087890625, 0.22589111328125, 0.350067138671875, 0.4742431640625, 0.598419189453125, 0.72259521484375, 0.846771240234375, 0.970947265625, 1.095123291015625, 1.21929931640625, 1.343475341796875, 1.4676513671875, 1.591827392578125, 1.71600341796875, 1.840179443359375, 1.96435546875, 2.088531494140625, 2.21270751953125, 2.336883544921875, 2.4610595703125, 2.585235595703125, 2.70941162109375, 2.833587646484375, 2.957763671875, 3.081939697265625, 3.20611572265625, 3.330291748046875, 3.4544677734375, 3.578643798828125, 3.70281982421875, 3.826995849609375, 3.951171875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 8.0, 6.0, 8.0, 9.0, 10.0, 13.0, 12.0, 23.0, 19.0, 36.0, 35.0, 46.0, 57.0, 70.0, 48.0, 80.0, 81.0, 68.0, 61.0, 65.0, 50.0, 39.0, 33.0, 22.0, 24.0, 15.0, 15.0, 17.0, 9.0, 10.0, 5.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.56640625, -1.510955810546875, -1.45550537109375, -1.400054931640625, -1.3446044921875, -1.289154052734375, -1.23370361328125, -1.178253173828125, -1.122802734375, -1.067352294921875, -1.01190185546875, -0.956451416015625, -0.9010009765625, -0.845550537109375, -0.79010009765625, -0.734649658203125, -0.67919921875, -0.623748779296875, -0.56829833984375, -0.512847900390625, -0.4573974609375, -0.401947021484375, -0.34649658203125, -0.291046142578125, -0.235595703125, -0.180145263671875, -0.12469482421875, -0.069244384765625, -0.0137939453125, 0.041656494140625, 0.09710693359375, 0.152557373046875, 0.2080078125, 0.263458251953125, 0.31890869140625, 0.374359130859375, 0.4298095703125, 0.485260009765625, 0.54071044921875, 0.596160888671875, 0.651611328125, 0.707061767578125, 0.76251220703125, 0.817962646484375, 0.8734130859375, 0.928863525390625, 0.98431396484375, 1.039764404296875, 1.09521484375, 1.150665283203125, 1.20611572265625, 1.261566162109375, 1.3170166015625, 1.372467041015625, 1.42791748046875, 1.483367919921875, 1.538818359375, 1.594268798828125, 1.64971923828125, 1.705169677734375, 1.7606201171875, 1.816070556640625, 1.87152099609375, 1.926971435546875, 1.982421875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 7.0, 14.0, 24.0, 63.0, 120.0, 335.0, 909.0, 3276.0, 15390.0, 135555.0, 3893901.0, 125258.0, 14817.0, 3184.0, 848.0, 307.0, 138.0, 58.0, 38.0, 24.0, 6.0, 5.0, 6.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-10.6953125, -10.4375, -10.1796875, -9.921875, -9.6640625, -9.40625, -9.1484375, -8.890625, -8.6328125, -8.375, -8.1171875, -7.859375, -7.6015625, -7.34375, -7.0859375, -6.828125, -6.5703125, -6.3125, -6.0546875, -5.796875, -5.5390625, -5.28125, -5.0234375, -4.765625, -4.5078125, -4.25, -3.9921875, -3.734375, -3.4765625, -3.21875, -2.9609375, -2.703125, -2.4453125, -2.1875, -1.9296875, -1.671875, -1.4140625, -1.15625, -0.8984375, -0.640625, -0.3828125, -0.125, 0.1328125, 0.390625, 0.6484375, 0.90625, 1.1640625, 1.421875, 1.6796875, 1.9375, 2.1953125, 2.453125, 2.7109375, 2.96875, 3.2265625, 3.484375, 3.7421875, 4.0, 4.2578125, 4.515625, 4.7734375, 5.03125, 5.2890625, 5.546875, 5.8046875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 6.0, 7.0, 6.0, 5.0, 16.0, 29.0, 46.0, 43.0, 89.0, 141.0, 359.0, 1616.0, 1054.0, 274.0, 136.0, 74.0, 54.0, 35.0, 20.0, 21.0, 18.0, 9.0, 10.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.97265625, -5.75836181640625, -5.5440673828125, -5.32977294921875, -5.115478515625, -4.90118408203125, -4.6868896484375, -4.47259521484375, -4.25830078125, -4.04400634765625, -3.8297119140625, -3.61541748046875, -3.401123046875, -3.18682861328125, -2.9725341796875, -2.75823974609375, -2.5439453125, -2.32965087890625, -2.1153564453125, -1.90106201171875, -1.686767578125, -1.47247314453125, -1.2581787109375, -1.04388427734375, -0.82958984375, -0.61529541015625, -0.4010009765625, -0.18670654296875, 0.027587890625, 0.24188232421875, 0.4561767578125, 0.67047119140625, 0.884765625, 1.09906005859375, 1.3133544921875, 1.52764892578125, 1.741943359375, 1.95623779296875, 2.1705322265625, 2.38482666015625, 2.59912109375, 2.81341552734375, 3.0277099609375, 3.24200439453125, 3.456298828125, 3.67059326171875, 3.8848876953125, 4.09918212890625, 4.3134765625, 4.52777099609375, 4.7420654296875, 4.95635986328125, 5.170654296875, 5.38494873046875, 5.5992431640625, 5.81353759765625, 6.02783203125, 6.24212646484375, 6.4564208984375, 6.67071533203125, 6.885009765625, 7.09930419921875, 7.3135986328125, 7.52789306640625, 7.7421875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 7.0, 3.0, 13.0, 30.0, 37.0, 65.0, 138.0, 219.0, 175.0, 119.0, 72.0, 50.0, 23.0, 14.0, 5.0, 11.0, 7.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-52.504051208496094, -51.117774963378906, -49.73149871826172, -48.34522247314453, -46.958946228027344, -45.572669982910156, -44.18639373779297, -42.80011749267578, -41.413841247558594, -40.027565002441406, -38.64128875732422, -37.25501251220703, -35.868736267089844, -34.482460021972656, -33.09618377685547, -31.70990753173828, -30.323633193969727, -28.93735694885254, -27.55108070373535, -26.164804458618164, -24.778528213500977, -23.39225196838379, -22.005977630615234, -20.619701385498047, -19.23342514038086, -17.847148895263672, -16.460872650146484, -15.074596405029297, -13.68832015991211, -12.302043914794922, -10.91576862335205, -9.529492378234863, -8.14321517944336, -6.756938934326172, -5.370662689208984, -3.984386920928955, -2.5981106758117676, -1.21183443069458, 0.17444133758544922, 1.5607175827026367, 2.946993827819824, 4.333270072937012, 5.719546318054199, 7.1058220863342285, 8.492097854614258, 9.878374099731445, 11.264650344848633, 12.65092658996582, 14.037202835083008, 15.423479080200195, 16.809755325317383, 18.19603157043457, 19.582307815551758, 20.968584060668945, 22.3548583984375, 23.741134643554688, 25.127410888671875, 26.513687133789062, 27.89996337890625, 29.286239624023438, 30.672515869140625, 32.05879211425781, 33.445068359375, 34.83134460449219, 36.217620849609375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 3.0, 4.0, 8.0, 7.0, 10.0, 18.0, 13.0, 23.0, 25.0, 28.0, 31.0, 26.0, 26.0, 49.0, 35.0, 39.0, 46.0, 50.0, 43.0, 57.0, 67.0, 28.0, 39.0, 36.0, 32.0, 31.0, 30.0, 26.0, 23.0, 24.0, 30.0, 12.0, 14.0, 14.0, 8.0, 9.0, 11.0, 6.0, 6.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-19.306528091430664, -18.70243263244629, -18.09833526611328, -17.494239807128906, -16.89014434814453, -16.286046981811523, -15.681951522827148, -15.077855110168457, -14.473758697509766, -13.869662284851074, -13.265565872192383, -12.661470413208008, -12.057374000549316, -11.453277587890625, -10.84918212890625, -10.245085716247559, -9.640989303588867, -9.036892890930176, -8.432796478271484, -7.828701019287109, -7.224604606628418, -6.620508193969727, -6.016412258148193, -5.41231632232666, -4.808219909667969, -4.204123497009277, -3.600027561187744, -2.995931386947632, -2.3918352127075195, -1.7877390384674072, -1.183642864227295, -0.5795469284057617, 0.0245513916015625, 0.6286475658416748, 1.232743740081787, 1.8368399143218994, 2.4409360885620117, 3.045032262802124, 3.6491284370422363, 4.2532243728637695, 4.857320785522461, 5.461417198181152, 6.0655131340026855, 6.669609069824219, 7.27370548248291, 7.877801895141602, 8.481897354125977, 9.085993766784668, 9.69009017944336, 10.29418659210205, 10.898283004760742, 11.502378463745117, 12.106474876403809, 12.7105712890625, 13.314666748046875, 13.918763160705566, 14.522859573364258, 15.12695598602295, 15.73105239868164, 16.335147857666016, 16.93924331665039, 17.5433406829834, 18.147436141967773, 18.75153350830078, 19.355628967285156]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 8.0, 10.0, 13.0, 34.0, 52.0, 64.0, 120.0, 220.0, 396.0, 707.0, 1402.0, 2823.0, 6877.0, 19235.0, 66128.0, 303369.0, 492676.0, 108556.0, 28667.0, 9642.0, 3800.0, 1733.0, 940.0, 463.0, 248.0, 147.0, 77.0, 57.0, 35.0, 16.0, 15.0, 9.0, 9.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.16015625, -5.0091552734375, -4.858154296875, -4.7071533203125, -4.55615234375, -4.4051513671875, -4.254150390625, -4.1031494140625, -3.9521484375, -3.8011474609375, -3.650146484375, -3.4991455078125, -3.34814453125, -3.1971435546875, -3.046142578125, -2.8951416015625, -2.744140625, -2.5931396484375, -2.442138671875, -2.2911376953125, -2.14013671875, -1.9891357421875, -1.838134765625, -1.6871337890625, -1.5361328125, -1.3851318359375, -1.234130859375, -1.0831298828125, -0.93212890625, -0.7811279296875, -0.630126953125, -0.4791259765625, -0.328125, -0.1771240234375, -0.026123046875, 0.1248779296875, 0.27587890625, 0.4268798828125, 0.577880859375, 0.7288818359375, 0.8798828125, 1.0308837890625, 1.181884765625, 1.3328857421875, 1.48388671875, 1.6348876953125, 1.785888671875, 1.9368896484375, 2.087890625, 2.2388916015625, 2.389892578125, 2.5408935546875, 2.69189453125, 2.8428955078125, 2.993896484375, 3.1448974609375, 3.2958984375, 3.4468994140625, 3.597900390625, 3.7489013671875, 3.89990234375, 4.0509033203125, 4.201904296875, 4.3529052734375, 4.50390625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 6.0, 8.0, 5.0, 11.0, 16.0, 33.0, 34.0, 44.0, 42.0, 49.0, 66.0, 63.0, 83.0, 74.0, 76.0, 67.0, 66.0, 48.0, 46.0, 32.0, 30.0, 29.0, 21.0, 20.0, 11.0, 4.0, 3.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.767578125, -1.709686279296875, -1.65179443359375, -1.593902587890625, -1.5360107421875, -1.478118896484375, -1.42022705078125, -1.362335205078125, -1.304443359375, -1.246551513671875, -1.18865966796875, -1.130767822265625, -1.0728759765625, -1.014984130859375, -0.95709228515625, -0.899200439453125, -0.84130859375, -0.783416748046875, -0.72552490234375, -0.667633056640625, -0.6097412109375, -0.551849365234375, -0.49395751953125, -0.436065673828125, -0.378173828125, -0.320281982421875, -0.26239013671875, -0.204498291015625, -0.1466064453125, -0.088714599609375, -0.03082275390625, 0.027069091796875, 0.0849609375, 0.142852783203125, 0.20074462890625, 0.258636474609375, 0.3165283203125, 0.374420166015625, 0.43231201171875, 0.490203857421875, 0.548095703125, 0.605987548828125, 0.66387939453125, 0.721771240234375, 0.7796630859375, 0.837554931640625, 0.89544677734375, 0.953338623046875, 1.01123046875, 1.069122314453125, 1.12701416015625, 1.184906005859375, 1.2427978515625, 1.300689697265625, 1.35858154296875, 1.416473388671875, 1.474365234375, 1.532257080078125, 1.59014892578125, 1.648040771484375, 1.7059326171875, 1.763824462890625, 1.82171630859375, 1.879608154296875, 1.9375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 2.0, 8.0, 15.0, 24.0, 26.0, 48.0, 56.0, 74.0, 134.0, 197.0, 401.0, 783.0, 1695.0, 4312.0, 15682.0, 103588.0, 765126.0, 130143.0, 17943.0, 4688.0, 1649.0, 839.0, 444.0, 228.0, 161.0, 96.0, 56.0, 43.0, 22.0, 19.0, 9.0, 10.0, 6.0, 5.0, 6.0, 5.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.5234375, -7.32305908203125, -7.1226806640625, -6.92230224609375, -6.721923828125, -6.52154541015625, -6.3211669921875, -6.12078857421875, -5.92041015625, -5.72003173828125, -5.5196533203125, -5.31927490234375, -5.118896484375, -4.91851806640625, -4.7181396484375, -4.51776123046875, -4.3173828125, -4.11700439453125, -3.9166259765625, -3.71624755859375, -3.515869140625, -3.31549072265625, -3.1151123046875, -2.91473388671875, -2.71435546875, -2.51397705078125, -2.3135986328125, -2.11322021484375, -1.912841796875, -1.71246337890625, -1.5120849609375, -1.31170654296875, -1.111328125, -0.91094970703125, -0.7105712890625, -0.51019287109375, -0.309814453125, -0.10943603515625, 0.0909423828125, 0.29132080078125, 0.49169921875, 0.69207763671875, 0.8924560546875, 1.09283447265625, 1.293212890625, 1.49359130859375, 1.6939697265625, 1.89434814453125, 2.0947265625, 2.29510498046875, 2.4954833984375, 2.69586181640625, 2.896240234375, 3.09661865234375, 3.2969970703125, 3.49737548828125, 3.69775390625, 3.89813232421875, 4.0985107421875, 4.29888916015625, 4.499267578125, 4.69964599609375, 4.9000244140625, 5.10040283203125, 5.30078125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 1.0, 4.0, 11.0, 5.0, 10.0, 11.0, 22.0, 26.0, 20.0, 33.0, 42.0, 39.0, 53.0, 53.0, 59.0, 61.0, 62.0, 62.0, 53.0, 62.0, 58.0, 52.0, 38.0, 28.0, 23.0, 23.0, 15.0, 21.0, 13.0, 6.0, 8.0, 5.0, 5.0, 5.0, 4.0, 1.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.359375, -7.14306640625, -6.9267578125, -6.71044921875, -6.494140625, -6.27783203125, -6.0615234375, -5.84521484375, -5.62890625, -5.41259765625, -5.1962890625, -4.97998046875, -4.763671875, -4.54736328125, -4.3310546875, -4.11474609375, -3.8984375, -3.68212890625, -3.4658203125, -3.24951171875, -3.033203125, -2.81689453125, -2.6005859375, -2.38427734375, -2.16796875, -1.95166015625, -1.7353515625, -1.51904296875, -1.302734375, -1.08642578125, -0.8701171875, -0.65380859375, -0.4375, -0.22119140625, -0.0048828125, 0.21142578125, 0.427734375, 0.64404296875, 0.8603515625, 1.07666015625, 1.29296875, 1.50927734375, 1.7255859375, 1.94189453125, 2.158203125, 2.37451171875, 2.5908203125, 2.80712890625, 3.0234375, 3.23974609375, 3.4560546875, 3.67236328125, 3.888671875, 4.10498046875, 4.3212890625, 4.53759765625, 4.75390625, 4.97021484375, 5.1865234375, 5.40283203125, 5.619140625, 5.83544921875, 6.0517578125, 6.26806640625, 6.484375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 9.0, 10.0, 22.0, 15.0, 52.0, 60.0, 148.0, 324.0, 804.0, 2624.0, 17437.0, 835336.0, 180916.0, 8089.0, 1628.0, 566.0, 241.0, 110.0, 58.0, 37.0, 25.0, 10.0, 8.0, 5.0, 2.0, 2.0, 5.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.078125, -5.90362548828125, -5.7291259765625, -5.55462646484375, -5.380126953125, -5.20562744140625, -5.0311279296875, -4.85662841796875, -4.68212890625, -4.50762939453125, -4.3331298828125, -4.15863037109375, -3.984130859375, -3.80963134765625, -3.6351318359375, -3.46063232421875, -3.2861328125, -3.11163330078125, -2.9371337890625, -2.76263427734375, -2.588134765625, -2.41363525390625, -2.2391357421875, -2.06463623046875, -1.89013671875, -1.71563720703125, -1.5411376953125, -1.36663818359375, -1.192138671875, -1.01763916015625, -0.8431396484375, -0.66864013671875, -0.494140625, -0.31964111328125, -0.1451416015625, 0.02935791015625, 0.203857421875, 0.37835693359375, 0.5528564453125, 0.72735595703125, 0.90185546875, 1.07635498046875, 1.2508544921875, 1.42535400390625, 1.599853515625, 1.77435302734375, 1.9488525390625, 2.12335205078125, 2.2978515625, 2.47235107421875, 2.6468505859375, 2.82135009765625, 2.995849609375, 3.17034912109375, 3.3448486328125, 3.51934814453125, 3.69384765625, 3.86834716796875, 4.0428466796875, 4.21734619140625, 4.391845703125, 4.56634521484375, 4.7408447265625, 4.91534423828125, 5.08984375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 6.0, 3.0, 9.0, 10.0, 22.0, 38.0, 48.0, 69.0, 126.0, 172.0, 194.0, 112.0, 58.0, 48.0, 25.0, 21.0, 9.0, 8.0, 8.0, 1.0, 6.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00043010711669921875, -0.00040959566831588745, -0.00038908421993255615, -0.00036857277154922485, -0.00034806132316589355, -0.00032754987478256226, -0.00030703842639923096, -0.00028652697801589966, -0.00026601552963256836, -0.00024550408124923706, -0.00022499263286590576, -0.00020448118448257446, -0.00018396973609924316, -0.00016345828771591187, -0.00014294683933258057, -0.00012243539094924927, -0.00010192394256591797, -8.141249418258667e-05, -6.090104579925537e-05, -4.038959741592407e-05, -1.9878149032592773e-05, 6.332993507385254e-07, 2.1144747734069824e-05, 4.165619611740112e-05, 6.216764450073242e-05, 8.267909288406372e-05, 0.00010319054126739502, 0.00012370198965072632, 0.00014421343803405762, 0.00016472488641738892, 0.00018523633480072021, 0.00020574778318405151, 0.0002262592315673828, 0.0002467706799507141, 0.0002672821283340454, 0.0002877935767173767, 0.000308305025100708, 0.0003288164734840393, 0.0003493279218673706, 0.0003698393702507019, 0.0003903508186340332, 0.0004108622670173645, 0.0004313737154006958, 0.0004518851637840271, 0.0004723966121673584, 0.0004929080605506897, 0.000513419508934021, 0.0005339309573173523, 0.0005544424057006836, 0.0005749538540840149, 0.0005954653024673462, 0.0006159767508506775, 0.0006364881992340088, 0.0006569996476173401, 0.0006775110960006714, 0.0006980225443840027, 0.000718533992767334, 0.0007390454411506653, 0.0007595568895339966, 0.0007800683379173279, 0.0008005797863006592, 0.0008210912346839905, 0.0008416026830673218, 0.0008621141314506531, 0.0008826255798339844]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 3.0, 5.0, 5.0, 5.0, 6.0, 4.0, 15.0, 11.0, 41.0, 42.0, 56.0, 104.0, 191.0, 383.0, 904.0, 2487.0, 10165.0, 125963.0, 858724.0, 40952.0, 5546.0, 1589.0, 615.0, 280.0, 170.0, 100.0, 62.0, 39.0, 29.0, 17.0, 15.0, 9.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-5.18359375, -5.055023193359375, -4.92645263671875, -4.797882080078125, -4.6693115234375, -4.540740966796875, -4.41217041015625, -4.283599853515625, -4.155029296875, -4.026458740234375, -3.89788818359375, -3.769317626953125, -3.6407470703125, -3.512176513671875, -3.38360595703125, -3.255035400390625, -3.12646484375, -2.997894287109375, -2.86932373046875, -2.740753173828125, -2.6121826171875, -2.483612060546875, -2.35504150390625, -2.226470947265625, -2.097900390625, -1.969329833984375, -1.84075927734375, -1.712188720703125, -1.5836181640625, -1.455047607421875, -1.32647705078125, -1.197906494140625, -1.0693359375, -0.940765380859375, -0.81219482421875, -0.683624267578125, -0.5550537109375, -0.426483154296875, -0.29791259765625, -0.169342041015625, -0.040771484375, 0.087799072265625, 0.21636962890625, 0.344940185546875, 0.4735107421875, 0.602081298828125, 0.73065185546875, 0.859222412109375, 0.98779296875, 1.116363525390625, 1.24493408203125, 1.373504638671875, 1.5020751953125, 1.630645751953125, 1.75921630859375, 1.887786865234375, 2.016357421875, 2.144927978515625, 2.27349853515625, 2.402069091796875, 2.5306396484375, 2.659210205078125, 2.78778076171875, 2.916351318359375, 3.044921875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 3.0, 4.0, 2.0, 2.0, 6.0, 9.0, 8.0, 14.0, 25.0, 24.0, 32.0, 29.0, 55.0, 63.0, 96.0, 114.0, 115.0, 90.0, 87.0, 48.0, 38.0, 26.0, 25.0, 25.0, 15.0, 11.0, 9.0, 7.0, 5.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.830078125, -3.7394866943359375, -3.648895263671875, -3.5583038330078125, -3.46771240234375, -3.3771209716796875, -3.286529541015625, -3.1959381103515625, -3.1053466796875, -3.0147552490234375, -2.924163818359375, -2.8335723876953125, -2.74298095703125, -2.6523895263671875, -2.561798095703125, -2.4712066650390625, -2.380615234375, -2.2900238037109375, -2.199432373046875, -2.1088409423828125, -2.01824951171875, -1.9276580810546875, -1.837066650390625, -1.7464752197265625, -1.6558837890625, -1.5652923583984375, -1.474700927734375, -1.3841094970703125, -1.29351806640625, -1.2029266357421875, -1.112335205078125, -1.0217437744140625, -0.93115234375, -0.8405609130859375, -0.749969482421875, -0.6593780517578125, -0.56878662109375, -0.4781951904296875, -0.387603759765625, -0.2970123291015625, -0.2064208984375, -0.1158294677734375, -0.025238037109375, 0.0653533935546875, 0.15594482421875, 0.2465362548828125, 0.337127685546875, 0.4277191162109375, 0.518310546875, 0.6089019775390625, 0.699493408203125, 0.7900848388671875, 0.88067626953125, 0.9712677001953125, 1.061859130859375, 1.1524505615234375, 1.2430419921875, 1.3336334228515625, 1.424224853515625, 1.5148162841796875, 1.60540771484375, 1.6959991455078125, 1.786590576171875, 1.8771820068359375, 1.9677734375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 8.0, 8.0, 10.0, 34.0, 64.0, 141.0, 268.0, 246.0, 126.0, 55.0, 20.0, 14.0, 8.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.88066101074219, -81.82772064208984, -79.77478790283203, -77.72184753417969, -75.66891479492188, -73.61597442626953, -71.56303405761719, -69.51010131835938, -67.45716094970703, -65.40422058105469, -63.351287841796875, -61.29834747314453, -59.24541091918945, -57.192474365234375, -55.13953399658203, -53.08659744262695, -51.033660888671875, -48.9807243347168, -46.92778778076172, -44.874847412109375, -42.8219108581543, -40.76897430419922, -38.716033935546875, -36.6630973815918, -34.61016082763672, -32.55722427368164, -30.50428581237793, -28.45134735107422, -26.39841079711914, -24.345474243164062, -22.29253578186035, -20.23959732055664, -18.18665313720703, -16.133716583251953, -14.080778121948242, -12.027840614318848, -9.974903106689453, -7.921965599060059, -5.869028091430664, -3.8160905838012695, -1.763153076171875, 0.28978443145751953, 2.342721939086914, 4.395659446716309, 6.448596954345703, 8.501534461975098, 10.554471969604492, 12.607409477233887, 14.660346984863281, 16.71328353881836, 18.76622200012207, 20.81916046142578, 22.87209701538086, 24.925033569335938, 26.97797203063965, 29.03091049194336, 31.083847045898438, 33.136783599853516, 35.189720153808594, 37.24266052246094, 39.295597076416016, 41.348533630371094, 43.40147399902344, 45.454410552978516, 47.507347106933594]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 6.0, 4.0, 10.0, 7.0, 10.0, 8.0, 30.0, 25.0, 24.0, 31.0, 38.0, 65.0, 62.0, 70.0, 79.0, 74.0, 66.0, 55.0, 58.0, 58.0, 49.0, 27.0, 30.0, 21.0, 24.0, 13.0, 16.0, 15.0, 5.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-40.44575500488281, -39.4511604309082, -38.456565856933594, -37.46196746826172, -36.46737289428711, -35.4727783203125, -34.47818374633789, -33.48358917236328, -32.488990783691406, -31.494396209716797, -30.499799728393555, -29.505205154418945, -28.510608673095703, -27.516014099121094, -26.521419525146484, -25.526824951171875, -24.532230377197266, -23.537635803222656, -22.543039321899414, -21.548444747924805, -20.553848266601562, -19.559253692626953, -18.564659118652344, -17.570064544677734, -16.575468063354492, -15.580872535705566, -14.58627700805664, -13.591682434082031, -12.597086906433105, -11.60249137878418, -10.60789680480957, -9.613301277160645, -8.618705749511719, -7.624110221862793, -6.629515171051025, -5.634920120239258, -4.640324592590332, -3.6457290649414062, -2.6511340141296387, -1.656538963317871, -0.6619434356689453, 0.33265185356140137, 1.327247142791748, 2.3218424320220947, 3.3164377212524414, 4.311033248901367, 5.305628299713135, 6.300223350524902, 7.294818878173828, 8.289414405822754, 9.28400993347168, 10.278604507446289, 11.273200035095215, 12.26779556274414, 13.26239013671875, 14.256985664367676, 15.251581192016602, 16.24617576599121, 17.240772247314453, 18.235366821289062, 19.229961395263672, 20.224557876586914, 21.219152450561523, 22.213748931884766, 23.208343505859375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 13.0, 4.0, 9.0, 15.0, 12.0, 17.0, 37.0, 37.0, 56.0, 84.0, 111.0, 157.0, 226.0, 293.0, 471.0, 732.0, 1260.0, 2121.0, 4267.0, 8944.0, 22696.0, 97100.0, 3234350.0, 730437.0, 58387.0, 17422.0, 7313.0, 3389.0, 1766.0, 927.0, 618.0, 343.0, 206.0, 139.0, 96.0, 68.0, 39.0, 28.0, 25.0, 16.0, 13.0, 7.0, 11.0, 3.0, 1.0, 2.0, 7.0, 1.0, 2.0], "bins": [-3.44140625, -3.350433349609375, -3.25946044921875, -3.168487548828125, -3.0775146484375, -2.986541748046875, -2.89556884765625, -2.804595947265625, -2.713623046875, -2.622650146484375, -2.53167724609375, -2.440704345703125, -2.3497314453125, -2.258758544921875, -2.16778564453125, -2.076812744140625, -1.98583984375, -1.894866943359375, -1.80389404296875, -1.712921142578125, -1.6219482421875, -1.530975341796875, -1.44000244140625, -1.349029541015625, -1.258056640625, -1.167083740234375, -1.07611083984375, -0.985137939453125, -0.8941650390625, -0.803192138671875, -0.71221923828125, -0.621246337890625, -0.5302734375, -0.439300537109375, -0.34832763671875, -0.257354736328125, -0.1663818359375, -0.075408935546875, 0.01556396484375, 0.106536865234375, 0.197509765625, 0.288482666015625, 0.37945556640625, 0.470428466796875, 0.5614013671875, 0.652374267578125, 0.74334716796875, 0.834320068359375, 0.92529296875, 1.016265869140625, 1.10723876953125, 1.198211669921875, 1.2891845703125, 1.380157470703125, 1.47113037109375, 1.562103271484375, 1.653076171875, 1.744049072265625, 1.83502197265625, 1.925994873046875, 2.0169677734375, 2.107940673828125, 2.19891357421875, 2.289886474609375, 2.380859375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 5.0, 10.0, 12.0, 16.0, 29.0, 54.0, 59.0, 82.0, 100.0, 95.0, 109.0, 114.0, 87.0, 59.0, 48.0, 41.0, 30.0, 20.0, 10.0, 7.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.326171875, -3.2507781982421875, -3.175384521484375, -3.0999908447265625, -3.02459716796875, -2.9492034912109375, -2.873809814453125, -2.7984161376953125, -2.7230224609375, -2.6476287841796875, -2.572235107421875, -2.4968414306640625, -2.42144775390625, -2.3460540771484375, -2.270660400390625, -2.1952667236328125, -2.119873046875, -2.0444793701171875, -1.969085693359375, -1.8936920166015625, -1.81829833984375, -1.7429046630859375, -1.667510986328125, -1.5921173095703125, -1.5167236328125, -1.4413299560546875, -1.365936279296875, -1.2905426025390625, -1.21514892578125, -1.1397552490234375, -1.064361572265625, -0.9889678955078125, -0.91357421875, -0.8381805419921875, -0.762786865234375, -0.6873931884765625, -0.61199951171875, -0.5366058349609375, -0.461212158203125, -0.3858184814453125, -0.3104248046875, -0.2350311279296875, -0.159637451171875, -0.0842437744140625, -0.00885009765625, 0.0665435791015625, 0.141937255859375, 0.2173309326171875, 0.292724609375, 0.3681182861328125, 0.443511962890625, 0.5189056396484375, 0.59429931640625, 0.6696929931640625, 0.745086669921875, 0.8204803466796875, 0.8958740234375, 0.9712677001953125, 1.046661376953125, 1.1220550537109375, 1.19744873046875, 1.2728424072265625, 1.348236083984375, 1.4236297607421875, 1.4990234375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 3.0, 5.0, 24.0, 26.0, 44.0, 62.0, 98.0, 161.0, 311.0, 590.0, 1159.0, 2337.0, 5161.0, 12445.0, 35346.0, 158156.0, 3372465.0, 510553.0, 63027.0, 18662.0, 7044.0, 3257.0, 1615.0, 761.0, 402.0, 240.0, 127.0, 80.0, 34.0, 32.0, 23.0, 10.0, 7.0, 4.0, 3.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.505859375, -3.401885986328125, -3.29791259765625, -3.193939208984375, -3.0899658203125, -2.985992431640625, -2.88201904296875, -2.778045654296875, -2.674072265625, -2.570098876953125, -2.46612548828125, -2.362152099609375, -2.2581787109375, -2.154205322265625, -2.05023193359375, -1.946258544921875, -1.84228515625, -1.738311767578125, -1.63433837890625, -1.530364990234375, -1.4263916015625, -1.322418212890625, -1.21844482421875, -1.114471435546875, -1.010498046875, -0.906524658203125, -0.80255126953125, -0.698577880859375, -0.5946044921875, -0.490631103515625, -0.38665771484375, -0.282684326171875, -0.1787109375, -0.074737548828125, 0.02923583984375, 0.133209228515625, 0.2371826171875, 0.341156005859375, 0.44512939453125, 0.549102783203125, 0.653076171875, 0.757049560546875, 0.86102294921875, 0.964996337890625, 1.0689697265625, 1.172943115234375, 1.27691650390625, 1.380889892578125, 1.48486328125, 1.588836669921875, 1.69281005859375, 1.796783447265625, 1.9007568359375, 2.004730224609375, 2.10870361328125, 2.212677001953125, 2.316650390625, 2.420623779296875, 2.52459716796875, 2.628570556640625, 2.7325439453125, 2.836517333984375, 2.94049072265625, 3.044464111328125, 3.1484375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 2.0, 4.0, 8.0, 8.0, 10.0, 8.0, 9.0, 17.0, 12.0, 28.0, 34.0, 36.0, 52.0, 57.0, 150.0, 263.0, 605.0, 1218.0, 702.0, 343.0, 148.0, 98.0, 61.0, 49.0, 30.0, 32.0, 22.0, 8.0, 10.0, 9.0, 4.0, 4.0, 6.0, 6.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.193359375, -3.095367431640625, -2.99737548828125, -2.899383544921875, -2.8013916015625, -2.703399658203125, -2.60540771484375, -2.507415771484375, -2.409423828125, -2.311431884765625, -2.21343994140625, -2.115447998046875, -2.0174560546875, -1.919464111328125, -1.82147216796875, -1.723480224609375, -1.62548828125, -1.527496337890625, -1.42950439453125, -1.331512451171875, -1.2335205078125, -1.135528564453125, -1.03753662109375, -0.939544677734375, -0.841552734375, -0.743560791015625, -0.64556884765625, -0.547576904296875, -0.4495849609375, -0.351593017578125, -0.25360107421875, -0.155609130859375, -0.0576171875, 0.040374755859375, 0.13836669921875, 0.236358642578125, 0.3343505859375, 0.432342529296875, 0.53033447265625, 0.628326416015625, 0.726318359375, 0.824310302734375, 0.92230224609375, 1.020294189453125, 1.1182861328125, 1.216278076171875, 1.31427001953125, 1.412261962890625, 1.51025390625, 1.608245849609375, 1.70623779296875, 1.804229736328125, 1.9022216796875, 2.000213623046875, 2.09820556640625, 2.196197509765625, 2.294189453125, 2.392181396484375, 2.49017333984375, 2.588165283203125, 2.6861572265625, 2.784149169921875, 2.88214111328125, 2.980133056640625, 3.078125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 4.0, 8.0, 12.0, 27.0, 61.0, 142.0, 248.0, 269.0, 122.0, 51.0, 22.0, 13.0, 9.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-45.43701934814453, -44.16937255859375, -42.901729583740234, -41.63408279418945, -40.36643981933594, -39.098793029785156, -37.831146240234375, -36.563499450683594, -35.29585647583008, -34.0282096862793, -32.76056671142578, -31.492919921875, -30.22527503967285, -28.957630157470703, -27.689983367919922, -26.422338485717773, -25.154693603515625, -23.887048721313477, -22.619403839111328, -21.351757049560547, -20.0841121673584, -18.81646728515625, -17.54882049560547, -16.28117561340332, -15.013530731201172, -13.745885848999023, -12.478240013122559, -11.210594177246094, -9.942949295043945, -8.675304412841797, -7.407658576965332, -6.140012741088867, -4.872364044189453, -3.6047186851501465, -2.33707332611084, -1.0694279670715332, 0.19821739196777344, 1.46586275100708, 2.7335081100463867, 4.001153945922852, 5.268798828125, 6.536444187164307, 7.804089546203613, 9.071735382080078, 10.339380264282227, 11.607025146484375, 12.87467098236084, 14.142316818237305, 15.409961700439453, 16.6776065826416, 17.94525146484375, 19.21289825439453, 20.48054313659668, 21.748188018798828, 23.01583480834961, 24.283479690551758, 25.551124572753906, 26.818769454956055, 28.086414337158203, 29.354061126708984, 30.621706008911133, 31.88935089111328, 33.15699768066406, 34.424644470214844, 35.69228744506836]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 2.0, 6.0, 12.0, 8.0, 14.0, 12.0, 12.0, 15.0, 18.0, 25.0, 15.0, 27.0, 33.0, 31.0, 28.0, 25.0, 32.0, 44.0, 49.0, 51.0, 39.0, 50.0, 44.0, 43.0, 34.0, 37.0, 29.0, 37.0, 37.0, 29.0, 17.0, 25.0, 10.0, 18.0, 17.0, 14.0, 8.0, 8.0, 5.0, 6.0, 7.0, 6.0, 6.0, 3.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-11.222179412841797, -10.851251602172852, -10.480324745178223, -10.109396934509277, -9.738469123840332, -9.367541313171387, -8.996614456176758, -8.625686645507812, -8.254758834838867, -7.88383150100708, -7.512903690338135, -7.141976356506348, -6.771048545837402, -6.400121212005615, -6.029193878173828, -5.658266067504883, -5.287338733673096, -4.916411399841309, -4.545483589172363, -4.174556255340576, -3.803628444671631, -3.4327011108398438, -3.0617735385894775, -2.6908459663391113, -2.319918394088745, -1.948990821838379, -1.5780632495880127, -1.207135796546936, -0.8362082242965698, -0.4652806520462036, -0.09435319900512695, 0.27657437324523926, 0.6475019454956055, 1.0184295177459717, 1.389357089996338, 1.7602845430374146, 2.1312122344970703, 2.5021395683288574, 2.8730671405792236, 3.24399471282959, 3.614922285079956, 3.9858498573303223, 4.356777191162109, 4.727705001831055, 5.098632335662842, 5.469560146331787, 5.840487480163574, 6.2114152908325195, 6.582342624664307, 6.953269958496094, 7.324197769165039, 7.695125102996826, 8.066052436828613, 8.436980247497559, 8.807908058166504, 9.178834915161133, 9.549762725830078, 9.920690536499023, 10.291617393493652, 10.662545204162598, 11.033473014831543, 11.404400825500488, 11.775327682495117, 12.146255493164062, 12.517183303833008]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 1.0, 7.0, 12.0, 11.0, 18.0, 32.0, 50.0, 51.0, 79.0, 120.0, 202.0, 270.0, 454.0, 690.0, 1187.0, 2099.0, 4123.0, 9196.0, 23504.0, 68653.0, 239542.0, 472439.0, 149015.0, 45895.0, 16540.0, 6794.0, 3165.0, 1706.0, 1022.0, 579.0, 344.0, 224.0, 155.0, 120.0, 71.0, 49.0, 38.0, 34.0, 19.0, 17.0, 9.0, 4.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-3.361328125, -3.25732421875, -3.1533203125, -3.04931640625, -2.9453125, -2.84130859375, -2.7373046875, -2.63330078125, -2.529296875, -2.42529296875, -2.3212890625, -2.21728515625, -2.11328125, -2.00927734375, -1.9052734375, -1.80126953125, -1.697265625, -1.59326171875, -1.4892578125, -1.38525390625, -1.28125, -1.17724609375, -1.0732421875, -0.96923828125, -0.865234375, -0.76123046875, -0.6572265625, -0.55322265625, -0.44921875, -0.34521484375, -0.2412109375, -0.13720703125, -0.033203125, 0.07080078125, 0.1748046875, 0.27880859375, 0.3828125, 0.48681640625, 0.5908203125, 0.69482421875, 0.798828125, 0.90283203125, 1.0068359375, 1.11083984375, 1.21484375, 1.31884765625, 1.4228515625, 1.52685546875, 1.630859375, 1.73486328125, 1.8388671875, 1.94287109375, 2.046875, 2.15087890625, 2.2548828125, 2.35888671875, 2.462890625, 2.56689453125, 2.6708984375, 2.77490234375, 2.87890625, 2.98291015625, 3.0869140625, 3.19091796875, 3.294921875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 9.0, 6.0, 8.0, 6.0, 11.0, 10.0, 31.0, 35.0, 30.0, 51.0, 56.0, 73.0, 75.0, 71.0, 75.0, 73.0, 75.0, 57.0, 49.0, 39.0, 37.0, 42.0, 28.0, 14.0, 20.0, 11.0, 7.0, 4.0, 2.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.990234375, -1.9340972900390625, -1.877960205078125, -1.8218231201171875, -1.76568603515625, -1.7095489501953125, -1.653411865234375, -1.5972747802734375, -1.5411376953125, -1.4850006103515625, -1.428863525390625, -1.3727264404296875, -1.31658935546875, -1.2604522705078125, -1.204315185546875, -1.1481781005859375, -1.092041015625, -1.0359039306640625, -0.979766845703125, -0.9236297607421875, -0.86749267578125, -0.8113555908203125, -0.755218505859375, -0.6990814208984375, -0.6429443359375, -0.5868072509765625, -0.530670166015625, -0.4745330810546875, -0.41839599609375, -0.3622589111328125, -0.306121826171875, -0.2499847412109375, -0.19384765625, -0.1377105712890625, -0.081573486328125, -0.0254364013671875, 0.03070068359375, 0.0868377685546875, 0.142974853515625, 0.1991119384765625, 0.2552490234375, 0.3113861083984375, 0.367523193359375, 0.4236602783203125, 0.47979736328125, 0.5359344482421875, 0.592071533203125, 0.6482086181640625, 0.704345703125, 0.7604827880859375, 0.816619873046875, 0.8727569580078125, 0.92889404296875, 0.9850311279296875, 1.041168212890625, 1.0973052978515625, 1.1534423828125, 1.2095794677734375, 1.265716552734375, 1.3218536376953125, 1.37799072265625, 1.4341278076171875, 1.490264892578125, 1.5464019775390625, 1.6025390625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 8.0, 9.0, 16.0, 24.0, 56.0, 71.0, 126.0, 227.0, 424.0, 963.0, 2951.0, 13287.0, 120502.0, 806950.0, 87760.0, 10877.0, 2563.0, 852.0, 417.0, 189.0, 105.0, 60.0, 36.0, 31.0, 13.0, 11.0, 6.0, 3.0, 7.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.88671875, -6.66766357421875, -6.4486083984375, -6.22955322265625, -6.010498046875, -5.79144287109375, -5.5723876953125, -5.35333251953125, -5.13427734375, -4.91522216796875, -4.6961669921875, -4.47711181640625, -4.258056640625, -4.03900146484375, -3.8199462890625, -3.60089111328125, -3.3818359375, -3.16278076171875, -2.9437255859375, -2.72467041015625, -2.505615234375, -2.28656005859375, -2.0675048828125, -1.84844970703125, -1.62939453125, -1.41033935546875, -1.1912841796875, -0.97222900390625, -0.753173828125, -0.53411865234375, -0.3150634765625, -0.09600830078125, 0.123046875, 0.34210205078125, 0.5611572265625, 0.78021240234375, 0.999267578125, 1.21832275390625, 1.4373779296875, 1.65643310546875, 1.87548828125, 2.09454345703125, 2.3135986328125, 2.53265380859375, 2.751708984375, 2.97076416015625, 3.1898193359375, 3.40887451171875, 3.6279296875, 3.84698486328125, 4.0660400390625, 4.28509521484375, 4.504150390625, 4.72320556640625, 4.9422607421875, 5.16131591796875, 5.38037109375, 5.59942626953125, 5.8184814453125, 6.03753662109375, 6.256591796875, 6.47564697265625, 6.6947021484375, 6.91375732421875, 7.1328125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 3.0, 1.0, 5.0, 8.0, 6.0, 5.0, 14.0, 9.0, 19.0, 25.0, 21.0, 26.0, 24.0, 30.0, 43.0, 42.0, 43.0, 45.0, 48.0, 63.0, 65.0, 41.0, 48.0, 41.0, 46.0, 31.0, 42.0, 42.0, 22.0, 23.0, 22.0, 20.0, 10.0, 13.0, 12.0, 11.0, 10.0, 5.0, 5.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.1171875, -3.97186279296875, -3.8265380859375, -3.68121337890625, -3.535888671875, -3.39056396484375, -3.2452392578125, -3.09991455078125, -2.95458984375, -2.80926513671875, -2.6639404296875, -2.51861572265625, -2.373291015625, -2.22796630859375, -2.0826416015625, -1.93731689453125, -1.7919921875, -1.64666748046875, -1.5013427734375, -1.35601806640625, -1.210693359375, -1.06536865234375, -0.9200439453125, -0.77471923828125, -0.62939453125, -0.48406982421875, -0.3387451171875, -0.19342041015625, -0.048095703125, 0.09722900390625, 0.2425537109375, 0.38787841796875, 0.533203125, 0.67852783203125, 0.8238525390625, 0.96917724609375, 1.114501953125, 1.25982666015625, 1.4051513671875, 1.55047607421875, 1.69580078125, 1.84112548828125, 1.9864501953125, 2.13177490234375, 2.277099609375, 2.42242431640625, 2.5677490234375, 2.71307373046875, 2.8583984375, 3.00372314453125, 3.1490478515625, 3.29437255859375, 3.439697265625, 3.58502197265625, 3.7303466796875, 3.87567138671875, 4.02099609375, 4.16632080078125, 4.3116455078125, 4.45697021484375, 4.602294921875, 4.74761962890625, 4.8929443359375, 5.03826904296875, 5.18359375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 2.0, 3.0, 6.0, 4.0, 9.0, 6.0, 11.0, 14.0, 22.0, 59.0, 116.0, 236.0, 546.0, 1882.0, 11894.0, 307544.0, 703347.0, 19082.0, 2533.0, 672.0, 262.0, 117.0, 75.0, 37.0, 32.0, 14.0, 8.0, 3.0, 10.0, 2.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.76171875, -3.660308837890625, -3.55889892578125, -3.457489013671875, -3.3560791015625, -3.254669189453125, -3.15325927734375, -3.051849365234375, -2.950439453125, -2.849029541015625, -2.74761962890625, -2.646209716796875, -2.5447998046875, -2.443389892578125, -2.34197998046875, -2.240570068359375, -2.13916015625, -2.037750244140625, -1.93634033203125, -1.834930419921875, -1.7335205078125, -1.632110595703125, -1.53070068359375, -1.429290771484375, -1.327880859375, -1.226470947265625, -1.12506103515625, -1.023651123046875, -0.9222412109375, -0.820831298828125, -0.71942138671875, -0.618011474609375, -0.5166015625, -0.415191650390625, -0.31378173828125, -0.212371826171875, -0.1109619140625, -0.009552001953125, 0.09185791015625, 0.193267822265625, 0.294677734375, 0.396087646484375, 0.49749755859375, 0.598907470703125, 0.7003173828125, 0.801727294921875, 0.90313720703125, 1.004547119140625, 1.10595703125, 1.207366943359375, 1.30877685546875, 1.410186767578125, 1.5115966796875, 1.613006591796875, 1.71441650390625, 1.815826416015625, 1.917236328125, 2.018646240234375, 2.12005615234375, 2.221466064453125, 2.3228759765625, 2.424285888671875, 2.52569580078125, 2.627105712890625, 2.728515625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 2.0, 6.0, 14.0, 10.0, 18.0, 36.0, 34.0, 47.0, 58.0, 78.0, 113.0, 118.0, 111.0, 95.0, 63.0, 62.0, 34.0, 34.0, 15.0, 13.0, 14.0, 11.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00027108192443847656, -0.0002601146697998047, -0.0002491474151611328, -0.00023818016052246094, -0.00022721290588378906, -0.0002162456512451172, -0.0002052783966064453, -0.00019431114196777344, -0.00018334388732910156, -0.0001723766326904297, -0.0001614093780517578, -0.00015044212341308594, -0.00013947486877441406, -0.0001285076141357422, -0.00011754035949707031, -0.00010657310485839844, -9.560585021972656e-05, -8.463859558105469e-05, -7.367134094238281e-05, -6.270408630371094e-05, -5.173683166503906e-05, -4.076957702636719e-05, -2.9802322387695312e-05, -1.8835067749023438e-05, -7.867813110351562e-06, 3.0994415283203125e-06, 1.4066696166992188e-05, 2.5033950805664062e-05, 3.600120544433594e-05, 4.696846008300781e-05, 5.793571472167969e-05, 6.890296936035156e-05, 7.987022399902344e-05, 9.083747863769531e-05, 0.00010180473327636719, 0.00011277198791503906, 0.00012373924255371094, 0.0001347064971923828, 0.0001456737518310547, 0.00015664100646972656, 0.00016760826110839844, 0.0001785755157470703, 0.0001895427703857422, 0.00020051002502441406, 0.00021147727966308594, 0.0002224445343017578, 0.0002334117889404297, 0.00024437904357910156, 0.00025534629821777344, 0.0002663135528564453, 0.0002772808074951172, 0.00028824806213378906, 0.00029921531677246094, 0.0003101825714111328, 0.0003211498260498047, 0.00033211708068847656, 0.00034308433532714844, 0.0003540515899658203, 0.0003650188446044922, 0.00037598609924316406, 0.00038695335388183594, 0.0003979206085205078, 0.0004088878631591797, 0.00041985511779785156, 0.00043082237243652344]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 8.0, 12.0, 12.0, 16.0, 31.0, 42.0, 67.0, 113.0, 173.0, 327.0, 613.0, 1368.0, 4021.0, 18452.0, 171825.0, 767641.0, 68746.0, 10161.0, 2721.0, 1061.0, 460.0, 270.0, 167.0, 87.0, 53.0, 26.0, 23.0, 16.0, 16.0, 7.0, 10.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8828125, -1.818603515625, -1.75439453125, -1.690185546875, -1.6259765625, -1.561767578125, -1.49755859375, -1.433349609375, -1.369140625, -1.304931640625, -1.24072265625, -1.176513671875, -1.1123046875, -1.048095703125, -0.98388671875, -0.919677734375, -0.85546875, -0.791259765625, -0.72705078125, -0.662841796875, -0.5986328125, -0.534423828125, -0.47021484375, -0.406005859375, -0.341796875, -0.277587890625, -0.21337890625, -0.149169921875, -0.0849609375, -0.020751953125, 0.04345703125, 0.107666015625, 0.171875, 0.236083984375, 0.30029296875, 0.364501953125, 0.4287109375, 0.492919921875, 0.55712890625, 0.621337890625, 0.685546875, 0.749755859375, 0.81396484375, 0.878173828125, 0.9423828125, 1.006591796875, 1.07080078125, 1.135009765625, 1.19921875, 1.263427734375, 1.32763671875, 1.391845703125, 1.4560546875, 1.520263671875, 1.58447265625, 1.648681640625, 1.712890625, 1.777099609375, 1.84130859375, 1.905517578125, 1.9697265625, 2.033935546875, 2.09814453125, 2.162353515625, 2.2265625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 3.0, 3.0, 8.0, 8.0, 3.0, 9.0, 16.0, 16.0, 30.0, 33.0, 40.0, 35.0, 61.0, 56.0, 76.0, 98.0, 78.0, 76.0, 68.0, 63.0, 39.0, 40.0, 35.0, 16.0, 20.0, 24.0, 11.0, 4.0, 7.0, 10.0, 6.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.9248046875, -1.8764495849609375, -1.828094482421875, -1.7797393798828125, -1.73138427734375, -1.6830291748046875, -1.634674072265625, -1.5863189697265625, -1.5379638671875, -1.4896087646484375, -1.441253662109375, -1.3928985595703125, -1.34454345703125, -1.2961883544921875, -1.247833251953125, -1.1994781494140625, -1.151123046875, -1.1027679443359375, -1.054412841796875, -1.0060577392578125, -0.95770263671875, -0.9093475341796875, -0.860992431640625, -0.8126373291015625, -0.7642822265625, -0.7159271240234375, -0.667572021484375, -0.6192169189453125, -0.57086181640625, -0.5225067138671875, -0.474151611328125, -0.4257965087890625, -0.37744140625, -0.3290863037109375, -0.280731201171875, -0.2323760986328125, -0.18402099609375, -0.1356658935546875, -0.087310791015625, -0.0389556884765625, 0.0093994140625, 0.0577545166015625, 0.106109619140625, 0.1544647216796875, 0.20281982421875, 0.2511749267578125, 0.299530029296875, 0.3478851318359375, 0.396240234375, 0.4445953369140625, 0.492950439453125, 0.5413055419921875, 0.58966064453125, 0.6380157470703125, 0.686370849609375, 0.7347259521484375, 0.7830810546875, 0.8314361572265625, 0.879791259765625, 0.9281463623046875, 0.97650146484375, 1.0248565673828125, 1.073211669921875, 1.1215667724609375, 1.169921875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 8.0, 14.0, 53.0, 131.0, 345.0, 291.0, 113.0, 30.0, 15.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.91323852539062, -71.73523712158203, -69.5572280883789, -67.37922668457031, -65.20121765136719, -63.023216247558594, -60.845211029052734, -58.667205810546875, -56.48920440673828, -54.31119918823242, -52.13319396972656, -49.95519256591797, -47.77718734741211, -45.59918212890625, -43.42117691040039, -41.24317169189453, -39.06516647338867, -36.88716125488281, -34.70915603637695, -32.531150817871094, -30.3531494140625, -28.17514419555664, -25.99713897705078, -23.819133758544922, -21.641130447387695, -19.463125228881836, -17.28512191772461, -15.10711669921875, -12.929112434387207, -10.751108169555664, -8.573102951049805, -6.395098686218262, -4.217094421386719, -2.0390899181365967, 0.1389145851135254, 2.3169193267822266, 4.4949235916137695, 6.6729278564453125, 8.850933074951172, 11.028937339782715, 13.206941604614258, 15.3849458694458, 17.562950134277344, 19.740955352783203, 21.918960571289062, 24.09696388244629, 26.27496910095215, 28.452972412109375, 30.630977630615234, 32.808982849121094, 34.98698806762695, 37.16499328613281, 39.342994689941406, 41.520999908447266, 43.699005126953125, 45.877010345458984, 48.055015563964844, 50.2330207824707, 52.41102600097656, 54.589027404785156, 56.767032623291016, 58.945037841796875, 61.123043060302734, 63.301048278808594, 65.47904968261719]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 6.0, 5.0, 8.0, 9.0, 10.0, 9.0, 15.0, 23.0, 22.0, 16.0, 31.0, 28.0, 31.0, 29.0, 41.0, 46.0, 62.0, 68.0, 69.0, 59.0, 64.0, 37.0, 30.0, 51.0, 36.0, 43.0, 31.0, 21.0, 21.0, 24.0, 15.0, 13.0, 7.0, 4.0, 5.0, 4.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.756563186645508, -21.063051223754883, -20.369537353515625, -19.676025390625, -18.982513427734375, -18.288999557495117, -17.595487594604492, -16.901973724365234, -16.20846176147461, -15.514948844909668, -14.821435928344727, -14.127923965454102, -13.43441104888916, -12.740898132324219, -12.047386169433594, -11.353873252868652, -10.660360336303711, -9.96684741973877, -9.273334503173828, -8.579822540283203, -7.886309623718262, -7.19279670715332, -6.499284267425537, -5.805771827697754, -5.1122589111328125, -4.418745994567871, -3.725233554840088, -3.0317208766937256, -2.3382081985473633, -1.644695520401001, -0.9511828422546387, -0.25767040252685547, 0.43584442138671875, 1.129357099533081, 1.8228697776794434, 2.5163824558258057, 3.209895133972168, 3.9034078121185303, 4.596920490264893, 5.290432929992676, 5.983945846557617, 6.677458763122559, 7.370971202850342, 8.064483642578125, 8.757996559143066, 9.451509475708008, 10.145021438598633, 10.838534355163574, 11.532047271728516, 12.225560188293457, 12.919073104858398, 13.612585067749023, 14.306097984313965, 14.999610900878906, 15.693122863769531, 16.386634826660156, 17.080148696899414, 17.77366065979004, 18.467174530029297, 19.160686492919922, 19.854198455810547, 20.547712326049805, 21.24122428894043, 21.934738159179688, 22.628250122070312]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 4.0, 3.0, 8.0, 15.0, 9.0, 20.0, 25.0, 32.0, 49.0, 76.0, 131.0, 250.0, 419.0, 823.0, 1640.0, 3729.0, 9186.0, 26044.0, 103478.0, 1071102.0, 2673471.0, 233502.0, 45767.0, 14388.0, 5687.0, 2334.0, 1089.0, 480.0, 258.0, 118.0, 77.0, 31.0, 14.0, 10.0, 8.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.62109375, -2.5604248046875, -2.499755859375, -2.4390869140625, -2.37841796875, -2.3177490234375, -2.257080078125, -2.1964111328125, -2.1357421875, -2.0750732421875, -2.014404296875, -1.9537353515625, -1.89306640625, -1.8323974609375, -1.771728515625, -1.7110595703125, -1.650390625, -1.5897216796875, -1.529052734375, -1.4683837890625, -1.40771484375, -1.3470458984375, -1.286376953125, -1.2257080078125, -1.1650390625, -1.1043701171875, -1.043701171875, -0.9830322265625, -0.92236328125, -0.8616943359375, -0.801025390625, -0.7403564453125, -0.6796875, -0.6190185546875, -0.558349609375, -0.4976806640625, -0.43701171875, -0.3763427734375, -0.315673828125, -0.2550048828125, -0.1943359375, -0.1336669921875, -0.072998046875, -0.0123291015625, 0.04833984375, 0.1090087890625, 0.169677734375, 0.2303466796875, 0.291015625, 0.3516845703125, 0.412353515625, 0.4730224609375, 0.53369140625, 0.5943603515625, 0.655029296875, 0.7156982421875, 0.7763671875, 0.8370361328125, 0.897705078125, 0.9583740234375, 1.01904296875, 1.0797119140625, 1.140380859375, 1.2010498046875, 1.26171875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 4.0, 10.0, 16.0, 16.0, 22.0, 34.0, 34.0, 63.0, 66.0, 67.0, 79.0, 75.0, 88.0, 84.0, 65.0, 78.0, 52.0, 41.0, 33.0, 23.0, 24.0, 18.0, 9.0, 7.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.6484375, -2.5921859741210938, -2.5359344482421875, -2.4796829223632812, -2.423431396484375, -2.3671798706054688, -2.3109283447265625, -2.2546768188476562, -2.19842529296875, -2.1421737670898438, -2.0859222412109375, -2.0296707153320312, -1.973419189453125, -1.9171676635742188, -1.8609161376953125, -1.8046646118164062, -1.7484130859375, -1.6921615600585938, -1.6359100341796875, -1.5796585083007812, -1.523406982421875, -1.4671554565429688, -1.4109039306640625, -1.3546524047851562, -1.29840087890625, -1.2421493530273438, -1.1858978271484375, -1.1296463012695312, -1.073394775390625, -1.0171432495117188, -0.9608917236328125, -0.9046401977539062, -0.848388671875, -0.7921371459960938, -0.7358856201171875, -0.6796340942382812, -0.623382568359375, -0.5671310424804688, -0.5108795166015625, -0.45462799072265625, -0.39837646484375, -0.34212493896484375, -0.2858734130859375, -0.22962188720703125, -0.173370361328125, -0.11711883544921875, -0.0608673095703125, -0.00461578369140625, 0.0516357421875, 0.10788726806640625, 0.1641387939453125, 0.22039031982421875, 0.276641845703125, 0.33289337158203125, 0.3891448974609375, 0.44539642333984375, 0.50164794921875, 0.5578994750976562, 0.6141510009765625, 0.6704025268554688, 0.726654052734375, 0.7829055786132812, 0.8391571044921875, 0.8954086303710938, 0.95166015625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 5.0, 5.0, 4.0, 12.0, 16.0, 13.0, 21.0, 44.0, 39.0, 96.0, 144.0, 251.0, 441.0, 953.0, 2061.0, 5204.0, 15182.0, 55558.0, 343458.0, 3334046.0, 344052.0, 61234.0, 18282.0, 6875.0, 2989.0, 1388.0, 763.0, 430.0, 246.0, 163.0, 98.0, 66.0, 39.0, 31.0, 22.0, 11.0, 10.0, 8.0, 7.0, 2.0, 4.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.662109375, -2.57757568359375, -2.4930419921875, -2.40850830078125, -2.323974609375, -2.23944091796875, -2.1549072265625, -2.07037353515625, -1.98583984375, -1.90130615234375, -1.8167724609375, -1.73223876953125, -1.647705078125, -1.56317138671875, -1.4786376953125, -1.39410400390625, -1.3095703125, -1.22503662109375, -1.1405029296875, -1.05596923828125, -0.971435546875, -0.88690185546875, -0.8023681640625, -0.71783447265625, -0.63330078125, -0.54876708984375, -0.4642333984375, -0.37969970703125, -0.295166015625, -0.21063232421875, -0.1260986328125, -0.04156494140625, 0.04296875, 0.12750244140625, 0.2120361328125, 0.29656982421875, 0.381103515625, 0.46563720703125, 0.5501708984375, 0.63470458984375, 0.71923828125, 0.80377197265625, 0.8883056640625, 0.97283935546875, 1.057373046875, 1.14190673828125, 1.2264404296875, 1.31097412109375, 1.3955078125, 1.48004150390625, 1.5645751953125, 1.64910888671875, 1.733642578125, 1.81817626953125, 1.9027099609375, 1.98724365234375, 2.07177734375, 2.15631103515625, 2.2408447265625, 2.32537841796875, 2.409912109375, 2.49444580078125, 2.5789794921875, 2.66351318359375, 2.748046875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 0.0, 8.0, 9.0, 6.0, 15.0, 9.0, 19.0, 19.0, 28.0, 45.0, 47.0, 74.0, 87.0, 172.0, 225.0, 412.0, 764.0, 744.0, 455.0, 256.0, 160.0, 105.0, 102.0, 74.0, 36.0, 40.0, 31.0, 23.0, 19.0, 14.0, 10.0, 16.0, 12.0, 6.0, 4.0, 2.0, 4.0, 3.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.169921875, -2.086669921875, -2.00341796875, -1.920166015625, -1.8369140625, -1.753662109375, -1.67041015625, -1.587158203125, -1.50390625, -1.420654296875, -1.33740234375, -1.254150390625, -1.1708984375, -1.087646484375, -1.00439453125, -0.921142578125, -0.837890625, -0.754638671875, -0.67138671875, -0.588134765625, -0.5048828125, -0.421630859375, -0.33837890625, -0.255126953125, -0.171875, -0.088623046875, -0.00537109375, 0.077880859375, 0.1611328125, 0.244384765625, 0.32763671875, 0.410888671875, 0.494140625, 0.577392578125, 0.66064453125, 0.743896484375, 0.8271484375, 0.910400390625, 0.99365234375, 1.076904296875, 1.16015625, 1.243408203125, 1.32666015625, 1.409912109375, 1.4931640625, 1.576416015625, 1.65966796875, 1.742919921875, 1.826171875, 1.909423828125, 1.99267578125, 2.075927734375, 2.1591796875, 2.242431640625, 2.32568359375, 2.408935546875, 2.4921875, 2.575439453125, 2.65869140625, 2.741943359375, 2.8251953125, 2.908447265625, 2.99169921875, 3.074951171875, 3.158203125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 6.0, 7.0, 43.0, 134.0, 329.0, 294.0, 107.0, 38.0, 11.0, 11.0, 8.0, 4.0, 5.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.229286193847656, -28.30753517150879, -26.385784149169922, -24.464035034179688, -22.542282104492188, -20.620532989501953, -18.698781967163086, -16.77703094482422, -14.855279922485352, -12.933528900146484, -11.011777877807617, -9.090027809143066, -7.168276786804199, -5.246525764465332, -3.3247756958007812, -1.403024673461914, 0.5187263488769531, 2.440477132797241, 4.362227916717529, 6.283978462219238, 8.205729484558105, 10.127480506896973, 12.049230575561523, 13.97098159790039, 15.892732620239258, 17.814483642578125, 19.736234664916992, 21.65798568725586, 23.579734802246094, 25.501487731933594, 27.423236846923828, 29.344987869262695, 31.266738891601562, 33.1884880065918, 35.1102409362793, 37.03199005126953, 38.95374298095703, 40.875492095947266, 42.7972412109375, 44.718994140625, 46.6407470703125, 48.562496185302734, 50.484249114990234, 52.40599822998047, 54.32775115966797, 56.2495002746582, 58.17124938964844, 60.09300231933594, 62.01475143432617, 63.936500549316406, 65.8582534790039, 67.7800064086914, 69.70175170898438, 71.62350463867188, 73.54525756835938, 75.46701049804688, 77.38875579833984, 79.31050872802734, 81.23225402832031, 83.15400695800781, 85.07575988769531, 86.99751281738281, 88.91925811767578, 90.84101104736328, 92.76276397705078]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 5.0, 9.0, 8.0, 9.0, 15.0, 15.0, 26.0, 33.0, 48.0, 34.0, 66.0, 61.0, 67.0, 54.0, 59.0, 62.0, 56.0, 61.0, 63.0, 46.0, 34.0, 27.0, 30.0, 22.0, 24.0, 17.0, 14.0, 11.0, 6.0, 4.0, 8.0, 3.0, 4.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.80950927734375, -16.142671585083008, -15.475834846496582, -14.808998107910156, -14.142160415649414, -13.475323677062988, -12.808486938476562, -12.14164924621582, -11.474812507629395, -10.807975769042969, -10.141138076782227, -9.4743013381958, -8.807464599609375, -8.140626907348633, -7.473790168762207, -6.806952953338623, -6.140115737915039, -5.473278522491455, -4.806441307067871, -4.139604568481445, -3.4727673530578613, -2.8059301376342773, -2.1390933990478516, -1.4722561836242676, -0.8054189682006836, -0.13858187198638916, 0.5282552242279053, 1.1950922012329102, 1.8619294166564941, 2.528766632080078, 3.195603370666504, 3.862440586090088, 4.529279708862305, 5.196116924285889, 5.862954139709473, 6.529790878295898, 7.196628093719482, 7.863465309143066, 8.530302047729492, 9.197139739990234, 9.86397647857666, 10.530813217163086, 11.197650909423828, 11.864487648010254, 12.53132438659668, 13.198162078857422, 13.864998817443848, 14.531835556030273, 15.198673248291016, 15.865509986877441, 16.532346725463867, 17.19918441772461, 17.86602210998535, 18.532859802246094, 19.199695587158203, 19.866533279418945, 20.533370971679688, 21.20020866394043, 21.86704444885254, 22.53388214111328, 23.200719833374023, 23.867557525634766, 24.534393310546875, 25.201231002807617, 25.868066787719727]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 8.0, 7.0, 6.0, 15.0, 14.0, 35.0, 43.0, 57.0, 78.0, 116.0, 175.0, 293.0, 441.0, 803.0, 1429.0, 2742.0, 5090.0, 10122.0, 21371.0, 46154.0, 103427.0, 244941.0, 338307.0, 148890.0, 64969.0, 29868.0, 14309.0, 6758.0, 3563.0, 1820.0, 1088.0, 607.0, 356.0, 218.0, 131.0, 108.0, 53.0, 45.0, 36.0, 17.0, 13.0, 14.0, 6.0, 5.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.30078125, -2.2293701171875, -2.157958984375, -2.0865478515625, -2.01513671875, -1.9437255859375, -1.872314453125, -1.8009033203125, -1.7294921875, -1.6580810546875, -1.586669921875, -1.5152587890625, -1.44384765625, -1.3724365234375, -1.301025390625, -1.2296142578125, -1.158203125, -1.0867919921875, -1.015380859375, -0.9439697265625, -0.87255859375, -0.8011474609375, -0.729736328125, -0.6583251953125, -0.5869140625, -0.5155029296875, -0.444091796875, -0.3726806640625, -0.30126953125, -0.2298583984375, -0.158447265625, -0.0870361328125, -0.015625, 0.0557861328125, 0.127197265625, 0.1986083984375, 0.27001953125, 0.3414306640625, 0.412841796875, 0.4842529296875, 0.5556640625, 0.6270751953125, 0.698486328125, 0.7698974609375, 0.84130859375, 0.9127197265625, 0.984130859375, 1.0555419921875, 1.126953125, 1.1983642578125, 1.269775390625, 1.3411865234375, 1.41259765625, 1.4840087890625, 1.555419921875, 1.6268310546875, 1.6982421875, 1.7696533203125, 1.841064453125, 1.9124755859375, 1.98388671875, 2.0552978515625, 2.126708984375, 2.1981201171875, 2.26953125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 2.0, 7.0, 5.0, 3.0, 8.0, 20.0, 8.0, 12.0, 15.0, 14.0, 22.0, 36.0, 30.0, 37.0, 29.0, 32.0, 33.0, 34.0, 40.0, 46.0, 47.0, 42.0, 51.0, 50.0, 36.0, 39.0, 42.0, 40.0, 21.0, 25.0, 30.0, 14.0, 16.0, 14.0, 17.0, 18.0, 11.0, 6.0, 12.0, 10.0, 5.0, 6.0, 4.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.9296875, -0.9017715454101562, -0.8738555908203125, -0.8459396362304688, -0.818023681640625, -0.7901077270507812, -0.7621917724609375, -0.7342758178710938, -0.70635986328125, -0.6784439086914062, -0.6505279541015625, -0.6226119995117188, -0.594696044921875, -0.5667800903320312, -0.5388641357421875, -0.5109481811523438, -0.4830322265625, -0.45511627197265625, -0.4272003173828125, -0.39928436279296875, -0.371368408203125, -0.34345245361328125, -0.3155364990234375, -0.28762054443359375, -0.25970458984375, -0.23178863525390625, -0.2038726806640625, -0.17595672607421875, -0.148040771484375, -0.12012481689453125, -0.0922088623046875, -0.06429290771484375, -0.036376953125, -0.00846099853515625, 0.0194549560546875, 0.04737091064453125, 0.075286865234375, 0.10320281982421875, 0.1311187744140625, 0.15903472900390625, 0.18695068359375, 0.21486663818359375, 0.2427825927734375, 0.27069854736328125, 0.298614501953125, 0.32653045654296875, 0.3544464111328125, 0.38236236572265625, 0.4102783203125, 0.43819427490234375, 0.4661102294921875, 0.49402618408203125, 0.521942138671875, 0.5498580932617188, 0.5777740478515625, 0.6056900024414062, 0.63360595703125, 0.6615219116210938, 0.6894378662109375, 0.7173538208007812, 0.745269775390625, 0.7731857299804688, 0.8011016845703125, 0.8290176391601562, 0.85693359375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 8.0, 6.0, 8.0, 10.0, 12.0, 17.0, 24.0, 31.0, 40.0, 53.0, 85.0, 125.0, 152.0, 206.0, 331.0, 528.0, 805.0, 1306.0, 2348.0, 4733.0, 12647.0, 48594.0, 259469.0, 593513.0, 89179.0, 20119.0, 6637.0, 3007.0, 1655.0, 974.0, 623.0, 408.0, 251.0, 187.0, 125.0, 98.0, 53.0, 52.0, 37.0, 33.0, 24.0, 11.0, 10.0, 5.0, 5.0, 8.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.537109375, -3.4237060546875, -3.310302734375, -3.1968994140625, -3.08349609375, -2.9700927734375, -2.856689453125, -2.7432861328125, -2.6298828125, -2.5164794921875, -2.403076171875, -2.2896728515625, -2.17626953125, -2.0628662109375, -1.949462890625, -1.8360595703125, -1.72265625, -1.6092529296875, -1.495849609375, -1.3824462890625, -1.26904296875, -1.1556396484375, -1.042236328125, -0.9288330078125, -0.8154296875, -0.7020263671875, -0.588623046875, -0.4752197265625, -0.36181640625, -0.2484130859375, -0.135009765625, -0.0216064453125, 0.091796875, 0.2052001953125, 0.318603515625, 0.4320068359375, 0.54541015625, 0.6588134765625, 0.772216796875, 0.8856201171875, 0.9990234375, 1.1124267578125, 1.225830078125, 1.3392333984375, 1.45263671875, 1.5660400390625, 1.679443359375, 1.7928466796875, 1.90625, 2.0196533203125, 2.133056640625, 2.2464599609375, 2.35986328125, 2.4732666015625, 2.586669921875, 2.7000732421875, 2.8134765625, 2.9268798828125, 3.040283203125, 3.1536865234375, 3.26708984375, 3.3804931640625, 3.493896484375, 3.6072998046875, 3.720703125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 6.0, 3.0, 9.0, 16.0, 7.0, 14.0, 17.0, 20.0, 29.0, 31.0, 38.0, 39.0, 47.0, 60.0, 48.0, 59.0, 60.0, 60.0, 64.0, 56.0, 42.0, 36.0, 33.0, 33.0, 30.0, 19.0, 27.0, 22.0, 20.0, 11.0, 10.0, 8.0, 10.0, 6.0, 6.0, 2.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.484375, -5.32757568359375, -5.1707763671875, -5.01397705078125, -4.857177734375, -4.70037841796875, -4.5435791015625, -4.38677978515625, -4.22998046875, -4.07318115234375, -3.9163818359375, -3.75958251953125, -3.602783203125, -3.44598388671875, -3.2891845703125, -3.13238525390625, -2.9755859375, -2.81878662109375, -2.6619873046875, -2.50518798828125, -2.348388671875, -2.19158935546875, -2.0347900390625, -1.87799072265625, -1.72119140625, -1.56439208984375, -1.4075927734375, -1.25079345703125, -1.093994140625, -0.93719482421875, -0.7803955078125, -0.62359619140625, -0.466796875, -0.30999755859375, -0.1531982421875, 0.00360107421875, 0.160400390625, 0.31719970703125, 0.4739990234375, 0.63079833984375, 0.78759765625, 0.94439697265625, 1.1011962890625, 1.25799560546875, 1.414794921875, 1.57159423828125, 1.7283935546875, 1.88519287109375, 2.0419921875, 2.19879150390625, 2.3555908203125, 2.51239013671875, 2.669189453125, 2.82598876953125, 2.9827880859375, 3.13958740234375, 3.29638671875, 3.45318603515625, 3.6099853515625, 3.76678466796875, 3.923583984375, 4.08038330078125, 4.2371826171875, 4.39398193359375, 4.55078125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 9.0, 14.0, 15.0, 41.0, 75.0, 166.0, 549.0, 2456.0, 32285.0, 958304.0, 50620.0, 3067.0, 581.0, 209.0, 95.0, 26.0, 22.0, 7.0, 3.0, 8.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.583984375, -2.482879638671875, -2.38177490234375, -2.280670166015625, -2.1795654296875, -2.078460693359375, -1.97735595703125, -1.876251220703125, -1.775146484375, -1.674041748046875, -1.57293701171875, -1.471832275390625, -1.3707275390625, -1.269622802734375, -1.16851806640625, -1.067413330078125, -0.96630859375, -0.865203857421875, -0.76409912109375, -0.662994384765625, -0.5618896484375, -0.460784912109375, -0.35968017578125, -0.258575439453125, -0.157470703125, -0.056365966796875, 0.04473876953125, 0.145843505859375, 0.2469482421875, 0.348052978515625, 0.44915771484375, 0.550262451171875, 0.6513671875, 0.752471923828125, 0.85357666015625, 0.954681396484375, 1.0557861328125, 1.156890869140625, 1.25799560546875, 1.359100341796875, 1.460205078125, 1.561309814453125, 1.66241455078125, 1.763519287109375, 1.8646240234375, 1.965728759765625, 2.06683349609375, 2.167938232421875, 2.26904296875, 2.370147705078125, 2.47125244140625, 2.572357177734375, 2.6734619140625, 2.774566650390625, 2.87567138671875, 2.976776123046875, 3.077880859375, 3.178985595703125, 3.28009033203125, 3.381195068359375, 3.4822998046875, 3.583404541015625, 3.68450927734375, 3.785614013671875, 3.88671875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 8.0, 6.0, 12.0, 24.0, 20.0, 34.0, 52.0, 72.0, 125.0, 163.0, 140.0, 103.0, 78.0, 54.0, 39.0, 24.0, 11.0, 9.0, 12.0, 6.0, 7.0, 1.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0006084442138671875, -0.0005939304828643799, -0.0005794167518615723, -0.0005649030208587646, -0.000550389289855957, -0.0005358755588531494, -0.0005213618278503418, -0.0005068480968475342, -0.0004923343658447266, -0.00047782063484191895, -0.00046330690383911133, -0.0004487931728363037, -0.0004342794418334961, -0.0004197657108306885, -0.00040525197982788086, -0.00039073824882507324, -0.0003762245178222656, -0.000361710786819458, -0.0003471970558166504, -0.0003326833248138428, -0.00031816959381103516, -0.00030365586280822754, -0.0002891421318054199, -0.0002746284008026123, -0.0002601146697998047, -0.00024560093879699707, -0.00023108720779418945, -0.00021657347679138184, -0.00020205974578857422, -0.0001875460147857666, -0.00017303228378295898, -0.00015851855278015137, -0.00014400482177734375, -0.00012949109077453613, -0.00011497735977172852, -0.0001004636287689209, -8.594989776611328e-05, -7.143616676330566e-05, -5.692243576049805e-05, -4.240870475769043e-05, -2.7894973754882812e-05, -1.3381242752075195e-05, 1.1324882507324219e-06, 1.564621925354004e-05, 3.0159950256347656e-05, 4.4673681259155273e-05, 5.918741226196289e-05, 7.370114326477051e-05, 8.821487426757812e-05, 0.00010272860527038574, 0.00011724233627319336, 0.00013175606727600098, 0.0001462697982788086, 0.0001607835292816162, 0.00017529726028442383, 0.00018981099128723145, 0.00020432472229003906, 0.00021883845329284668, 0.0002333521842956543, 0.0002478659152984619, 0.00026237964630126953, 0.00027689337730407715, 0.00029140710830688477, 0.0003059208393096924, 0.0003204345703125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 5.0, 5.0, 3.0, 7.0, 10.0, 18.0, 20.0, 21.0, 36.0, 57.0, 90.0, 121.0, 131.0, 220.0, 335.0, 543.0, 952.0, 1760.0, 3531.0, 8749.0, 27526.0, 140490.0, 669361.0, 148433.0, 29300.0, 8741.0, 3652.0, 1728.0, 997.0, 571.0, 344.0, 237.0, 148.0, 100.0, 78.0, 57.0, 48.0, 29.0, 26.0, 11.0, 21.0, 11.0, 7.0, 6.0, 10.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.97802734375, -0.9459762573242188, -0.9139251708984375, -0.8818740844726562, -0.849822998046875, -0.8177719116210938, -0.7857208251953125, -0.7536697387695312, -0.72161865234375, -0.6895675659179688, -0.6575164794921875, -0.6254653930664062, -0.593414306640625, -0.5613632202148438, -0.5293121337890625, -0.49726104736328125, -0.4652099609375, -0.43315887451171875, -0.4011077880859375, -0.36905670166015625, -0.337005615234375, -0.30495452880859375, -0.2729034423828125, -0.24085235595703125, -0.20880126953125, -0.17675018310546875, -0.1446990966796875, -0.11264801025390625, -0.080596923828125, -0.04854583740234375, -0.0164947509765625, 0.01555633544921875, 0.047607421875, 0.07965850830078125, 0.1117095947265625, 0.14376068115234375, 0.175811767578125, 0.20786285400390625, 0.2399139404296875, 0.27196502685546875, 0.30401611328125, 0.33606719970703125, 0.3681182861328125, 0.40016937255859375, 0.432220458984375, 0.46427154541015625, 0.4963226318359375, 0.5283737182617188, 0.5604248046875, 0.5924758911132812, 0.6245269775390625, 0.6565780639648438, 0.688629150390625, 0.7206802368164062, 0.7527313232421875, 0.7847824096679688, 0.81683349609375, 0.8488845825195312, 0.8809356689453125, 0.9129867553710938, 0.945037841796875, 0.9770889282226562, 1.0091400146484375, 1.0411911010742188, 1.0732421875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 5.0, 3.0, 6.0, 4.0, 8.0, 6.0, 8.0, 8.0, 12.0, 22.0, 18.0, 36.0, 30.0, 37.0, 42.0, 56.0, 54.0, 59.0, 63.0, 66.0, 71.0, 62.0, 46.0, 46.0, 31.0, 49.0, 29.0, 29.0, 30.0, 14.0, 16.0, 8.0, 3.0, 8.0, 4.0, 3.0, 7.0, 1.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0380859375, -1.0048675537109375, -0.971649169921875, -0.9384307861328125, -0.90521240234375, -0.8719940185546875, -0.838775634765625, -0.8055572509765625, -0.7723388671875, -0.7391204833984375, -0.705902099609375, -0.6726837158203125, -0.63946533203125, -0.6062469482421875, -0.573028564453125, -0.5398101806640625, -0.506591796875, -0.4733734130859375, -0.440155029296875, -0.4069366455078125, -0.37371826171875, -0.3404998779296875, -0.307281494140625, -0.2740631103515625, -0.2408447265625, -0.2076263427734375, -0.174407958984375, -0.1411895751953125, -0.10797119140625, -0.0747528076171875, -0.041534423828125, -0.0083160400390625, 0.02490234375, 0.0581207275390625, 0.091339111328125, 0.1245574951171875, 0.15777587890625, 0.1909942626953125, 0.224212646484375, 0.2574310302734375, 0.2906494140625, 0.3238677978515625, 0.357086181640625, 0.3903045654296875, 0.42352294921875, 0.4567413330078125, 0.489959716796875, 0.5231781005859375, 0.556396484375, 0.5896148681640625, 0.622833251953125, 0.6560516357421875, 0.68927001953125, 0.7224884033203125, 0.755706787109375, 0.7889251708984375, 0.8221435546875, 0.8553619384765625, 0.888580322265625, 0.9217987060546875, 0.95501708984375, 0.9882354736328125, 1.021453857421875, 1.0546722412109375, 1.087890625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 6.0, 7.0, 4.0, 16.0, 22.0, 35.0, 66.0, 89.0, 126.0, 248.0, 138.0, 94.0, 51.0, 41.0, 21.0, 9.0, 7.0, 5.0, 4.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.20698165893555, -35.37528610229492, -34.54359436035156, -33.71189880371094, -32.88020324707031, -32.04851150512695, -31.216815948486328, -30.385122299194336, -29.553428649902344, -28.72173500061035, -27.890039443969727, -27.058345794677734, -26.226652145385742, -25.39495849609375, -24.563262939453125, -23.731569290161133, -22.899873733520508, -22.068180084228516, -21.23648452758789, -20.4047908782959, -19.573097229003906, -18.74140167236328, -17.90970802307129, -17.078014373779297, -16.246318817138672, -15.414624214172363, -14.582930564880371, -13.751235961914062, -12.91954231262207, -12.087847709655762, -11.256153106689453, -10.424459457397461, -9.592767715454102, -8.761073112487793, -7.929379463195801, -7.097684860229492, -6.265990734100342, -5.434296607971191, -4.602602005004883, -3.7709078788757324, -2.939213752746582, -2.1075196266174316, -1.2758252620697021, -0.44413089752197266, 0.38756322860717773, 1.2192573547363281, 2.0509519577026367, 2.882646083831787, 3.7143402099609375, 4.546034336090088, 5.377728462219238, 6.209423065185547, 7.041117191314697, 7.872811317443848, 8.704505920410156, 9.536199569702148, 10.367894172668457, 11.199588775634766, 12.031282424926758, 12.862977027893066, 13.694671630859375, 14.526365280151367, 15.358059883117676, 16.189754486083984, 17.021448135375977]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 6.0, 11.0, 5.0, 6.0, 16.0, 12.0, 12.0, 18.0, 24.0, 28.0, 26.0, 18.0, 32.0, 38.0, 34.0, 48.0, 62.0, 73.0, 74.0, 73.0, 41.0, 33.0, 41.0, 45.0, 30.0, 33.0, 30.0, 17.0, 19.0, 17.0, 20.0, 10.0, 8.0, 10.0, 7.0, 8.0, 6.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.68695068359375, -16.132951736450195, -15.57895278930664, -15.02495288848877, -14.470953941345215, -13.91695499420166, -13.362955093383789, -12.808956146240234, -12.25495719909668, -11.700958251953125, -11.14695930480957, -10.5929594039917, -10.038960456848145, -9.48496150970459, -8.930961608886719, -8.376962661743164, -7.822963714599609, -7.268964767456055, -6.714965343475342, -6.160965919494629, -5.606966972351074, -5.0529680252075195, -4.498968601226807, -3.944969415664673, -3.390970230102539, -2.8369710445404053, -2.2829718589782715, -1.7289726734161377, -1.174973487854004, -0.6209743022918701, -0.06697511672973633, 0.48702406883239746, 1.0410232543945312, 1.595022439956665, 2.149021625518799, 2.7030208110809326, 3.2570199966430664, 3.8110191822052, 4.365018367767334, 4.919017791748047, 5.473016738891602, 6.027015686035156, 6.581015110015869, 7.135014533996582, 7.689013481140137, 8.243012428283691, 8.797012329101562, 9.351011276245117, 9.905010223388672, 10.459009170532227, 11.013008117675781, 11.567008018493652, 12.121006965637207, 12.675005912780762, 13.229005813598633, 13.783004760742188, 14.337003707885742, 14.891002655029297, 15.445001602172852, 15.999001502990723, 16.553001403808594, 17.10700035095215, 17.660999298095703, 18.214998245239258, 18.768997192382812]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 4.0, 4.0, 10.0, 13.0, 17.0, 39.0, 53.0, 70.0, 108.0, 183.0, 309.0, 557.0, 986.0, 1872.0, 3613.0, 7145.0, 15603.0, 39884.0, 145500.0, 955857.0, 2497802.0, 398509.0, 77882.0, 26307.0, 11134.0, 5103.0, 2590.0, 1338.0, 759.0, 417.0, 217.0, 154.0, 95.0, 60.0, 21.0, 21.0, 18.0, 9.0, 11.0, 8.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.5, -1.4586639404296875, -1.417327880859375, -1.3759918212890625, -1.33465576171875, -1.2933197021484375, -1.251983642578125, -1.2106475830078125, -1.1693115234375, -1.1279754638671875, -1.086639404296875, -1.0453033447265625, -1.00396728515625, -0.9626312255859375, -0.921295166015625, -0.8799591064453125, -0.838623046875, -0.7972869873046875, -0.755950927734375, -0.7146148681640625, -0.67327880859375, -0.6319427490234375, -0.590606689453125, -0.5492706298828125, -0.5079345703125, -0.4665985107421875, -0.425262451171875, -0.3839263916015625, -0.34259033203125, -0.3012542724609375, -0.259918212890625, -0.2185821533203125, -0.17724609375, -0.1359100341796875, -0.094573974609375, -0.0532379150390625, -0.01190185546875, 0.0294342041015625, 0.070770263671875, 0.1121063232421875, 0.1534423828125, 0.1947784423828125, 0.236114501953125, 0.2774505615234375, 0.31878662109375, 0.3601226806640625, 0.401458740234375, 0.4427947998046875, 0.484130859375, 0.5254669189453125, 0.566802978515625, 0.6081390380859375, 0.64947509765625, 0.6908111572265625, 0.732147216796875, 0.7734832763671875, 0.8148193359375, 0.8561553955078125, 0.897491455078125, 0.9388275146484375, 0.98016357421875, 1.0214996337890625, 1.062835693359375, 1.1041717529296875, 1.1455078125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 7.0, 4.0, 5.0, 11.0, 11.0, 13.0, 17.0, 12.0, 9.0, 26.0, 23.0, 24.0, 36.0, 35.0, 39.0, 42.0, 39.0, 39.0, 43.0, 47.0, 43.0, 49.0, 30.0, 55.0, 36.0, 48.0, 34.0, 29.0, 23.0, 26.0, 22.0, 15.0, 23.0, 16.0, 13.0, 7.0, 10.0, 3.0, 11.0, 10.0, 7.0, 6.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8193359375, -0.791656494140625, -0.76397705078125, -0.736297607421875, -0.7086181640625, -0.680938720703125, -0.65325927734375, -0.625579833984375, -0.597900390625, -0.570220947265625, -0.54254150390625, -0.514862060546875, -0.4871826171875, -0.459503173828125, -0.43182373046875, -0.404144287109375, -0.37646484375, -0.348785400390625, -0.32110595703125, -0.293426513671875, -0.2657470703125, -0.238067626953125, -0.21038818359375, -0.182708740234375, -0.155029296875, -0.127349853515625, -0.09967041015625, -0.071990966796875, -0.0443115234375, -0.016632080078125, 0.01104736328125, 0.038726806640625, 0.06640625, 0.094085693359375, 0.12176513671875, 0.149444580078125, 0.1771240234375, 0.204803466796875, 0.23248291015625, 0.260162353515625, 0.287841796875, 0.315521240234375, 0.34320068359375, 0.370880126953125, 0.3985595703125, 0.426239013671875, 0.45391845703125, 0.481597900390625, 0.50927734375, 0.536956787109375, 0.56463623046875, 0.592315673828125, 0.6199951171875, 0.647674560546875, 0.67535400390625, 0.703033447265625, 0.730712890625, 0.758392333984375, 0.78607177734375, 0.813751220703125, 0.8414306640625, 0.869110107421875, 0.89678955078125, 0.924468994140625, 0.9521484375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 7.0, 5.0, 10.0, 15.0, 10.0, 19.0, 30.0, 52.0, 69.0, 99.0, 126.0, 214.0, 403.0, 730.0, 1248.0, 2516.0, 5627.0, 14633.0, 46800.0, 213970.0, 2914582.0, 848451.0, 101392.0, 26944.0, 8954.0, 3493.0, 1684.0, 871.0, 497.0, 292.0, 181.0, 118.0, 67.0, 54.0, 35.0, 24.0, 22.0, 14.0, 6.0, 4.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 5.0, 0.0, 3.0, 1.0], "bins": [-2.115234375, -2.054412841796875, -1.99359130859375, -1.932769775390625, -1.8719482421875, -1.811126708984375, -1.75030517578125, -1.689483642578125, -1.628662109375, -1.567840576171875, -1.50701904296875, -1.446197509765625, -1.3853759765625, -1.324554443359375, -1.26373291015625, -1.202911376953125, -1.14208984375, -1.081268310546875, -1.02044677734375, -0.959625244140625, -0.8988037109375, -0.837982177734375, -0.77716064453125, -0.716339111328125, -0.655517578125, -0.594696044921875, -0.53387451171875, -0.473052978515625, -0.4122314453125, -0.351409912109375, -0.29058837890625, -0.229766845703125, -0.1689453125, -0.108123779296875, -0.04730224609375, 0.013519287109375, 0.0743408203125, 0.135162353515625, 0.19598388671875, 0.256805419921875, 0.317626953125, 0.378448486328125, 0.43927001953125, 0.500091552734375, 0.5609130859375, 0.621734619140625, 0.68255615234375, 0.743377685546875, 0.80419921875, 0.865020751953125, 0.92584228515625, 0.986663818359375, 1.0474853515625, 1.108306884765625, 1.16912841796875, 1.229949951171875, 1.290771484375, 1.351593017578125, 1.41241455078125, 1.473236083984375, 1.5340576171875, 1.594879150390625, 1.65570068359375, 1.716522216796875, 1.77734375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 12.0, 5.0, 8.0, 8.0, 19.0, 15.0, 36.0, 44.0, 65.0, 91.0, 167.0, 313.0, 598.0, 1049.0, 732.0, 345.0, 190.0, 143.0, 65.0, 37.0, 42.0, 23.0, 22.0, 17.0, 11.0, 9.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0], "bins": [-3.689453125, -3.596405029296875, -3.50335693359375, -3.410308837890625, -3.3172607421875, -3.224212646484375, -3.13116455078125, -3.038116455078125, -2.945068359375, -2.852020263671875, -2.75897216796875, -2.665924072265625, -2.5728759765625, -2.479827880859375, -2.38677978515625, -2.293731689453125, -2.20068359375, -2.107635498046875, -2.01458740234375, -1.921539306640625, -1.8284912109375, -1.735443115234375, -1.64239501953125, -1.549346923828125, -1.456298828125, -1.363250732421875, -1.27020263671875, -1.177154541015625, -1.0841064453125, -0.991058349609375, -0.89801025390625, -0.804962158203125, -0.7119140625, -0.618865966796875, -0.52581787109375, -0.432769775390625, -0.3397216796875, -0.246673583984375, -0.15362548828125, -0.060577392578125, 0.032470703125, 0.125518798828125, 0.21856689453125, 0.311614990234375, 0.4046630859375, 0.497711181640625, 0.59075927734375, 0.683807373046875, 0.77685546875, 0.869903564453125, 0.96295166015625, 1.055999755859375, 1.1490478515625, 1.242095947265625, 1.33514404296875, 1.428192138671875, 1.521240234375, 1.614288330078125, 1.70733642578125, 1.800384521484375, 1.8934326171875, 1.986480712890625, 2.07952880859375, 2.172576904296875, 2.265625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 17.0, 61.0, 367.0, 435.0, 87.0, 15.0, 7.0, 6.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.178726196289062, -24.17584800720215, -22.172969818115234, -20.170089721679688, -18.167211532592773, -16.16433334350586, -14.161454200744629, -12.158575057983398, -10.155696868896484, -8.15281867980957, -6.14993953704834, -4.147060871124268, -2.1441822052001953, -0.14130401611328125, 1.8615751266479492, 3.8644542694091797, 5.867332458496094, 7.870211124420166, 9.873089790344238, 11.875968933105469, 13.878847122192383, 15.881725311279297, 17.884605407714844, 19.887483596801758, 21.890361785888672, 23.893239974975586, 25.8961181640625, 27.898998260498047, 29.90187644958496, 31.904754638671875, 33.90763473510742, 35.91051483154297, 37.91338348388672, 39.916263580322266, 41.91913986206055, 43.922019958496094, 45.924896240234375, 47.92777633666992, 49.93065643310547, 51.93353271484375, 53.9364128112793, 55.939292907714844, 57.942169189453125, 59.94504928588867, 61.94792938232422, 63.9508056640625, 65.95368194580078, 67.9565658569336, 69.95944213867188, 71.96231842041016, 73.96520233154297, 75.96807861328125, 77.97095489501953, 79.97383117675781, 81.97671508789062, 83.9795913696289, 85.98246765136719, 87.98534393310547, 89.98822784423828, 91.99110412597656, 93.99398040771484, 95.99685668945312, 97.99974060058594, 100.00261688232422, 102.00550079345703]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 10.0, 11.0, 16.0, 16.0, 28.0, 25.0, 36.0, 42.0, 37.0, 55.0, 44.0, 58.0, 62.0, 72.0, 78.0, 58.0, 50.0, 55.0, 48.0, 35.0, 37.0, 23.0, 26.0, 20.0, 10.0, 10.0, 7.0, 9.0, 2.0, 6.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.574365615844727, -12.098608016967773, -11.622849464416504, -11.14709186553955, -10.671334266662598, -10.195575714111328, -9.719818115234375, -9.244060516357422, -8.768301963806152, -8.2925443649292, -7.816786289215088, -7.341028213500977, -6.865270137786865, -6.389512062072754, -5.913754463195801, -5.4379963874816895, -4.962238788604736, -4.486480712890625, -4.010723114013672, -3.5349650382995605, -3.059206962585449, -2.583449125289917, -2.1076912879943848, -1.6319332122802734, -1.1561753749847412, -0.6804174184799194, -0.20465952157974243, 0.27109837532043457, 0.7468563318252563, 1.2226142883300781, 1.6983721256256104, 2.1741302013397217, 2.649888038635254, 3.125645875930786, 3.6014039516448975, 4.07716178894043, 4.552919864654541, 5.028677940368652, 5.5044355392456055, 5.980193614959717, 6.455951690673828, 6.9317097663879395, 7.407467365264893, 7.883225440979004, 8.358983039855957, 8.834741592407227, 9.31049919128418, 9.786256790161133, 10.262014389038086, 10.737771987915039, 11.213530540466309, 11.689288139343262, 12.165045738220215, 12.640804290771484, 13.116561889648438, 13.59231948852539, 14.06807804107666, 14.543835639953613, 15.019594192504883, 15.495351791381836, 15.971109390258789, 16.446866989135742, 16.922626495361328, 17.39838409423828, 17.874141693115234]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 1.0, 16.0, 18.0, 26.0, 38.0, 61.0, 66.0, 163.0, 212.0, 369.0, 697.0, 1173.0, 2101.0, 3955.0, 8593.0, 19633.0, 49657.0, 133344.0, 348405.0, 298588.0, 108529.0, 41061.0, 16600.0, 7399.0, 3526.0, 1832.0, 992.0, 568.0, 341.0, 222.0, 126.0, 83.0, 55.0, 38.0, 19.0, 23.0, 8.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.357421875, -2.2857666015625, -2.214111328125, -2.1424560546875, -2.07080078125, -1.9991455078125, -1.927490234375, -1.8558349609375, -1.7841796875, -1.7125244140625, -1.640869140625, -1.5692138671875, -1.49755859375, -1.4259033203125, -1.354248046875, -1.2825927734375, -1.2109375, -1.1392822265625, -1.067626953125, -0.9959716796875, -0.92431640625, -0.8526611328125, -0.781005859375, -0.7093505859375, -0.6376953125, -0.5660400390625, -0.494384765625, -0.4227294921875, -0.35107421875, -0.2794189453125, -0.207763671875, -0.1361083984375, -0.064453125, 0.0072021484375, 0.078857421875, 0.1505126953125, 0.22216796875, 0.2938232421875, 0.365478515625, 0.4371337890625, 0.5087890625, 0.5804443359375, 0.652099609375, 0.7237548828125, 0.79541015625, 0.8670654296875, 0.938720703125, 1.0103759765625, 1.08203125, 1.1536865234375, 1.225341796875, 1.2969970703125, 1.36865234375, 1.4403076171875, 1.511962890625, 1.5836181640625, 1.6552734375, 1.7269287109375, 1.798583984375, 1.8702392578125, 1.94189453125, 2.0135498046875, 2.085205078125, 2.1568603515625, 2.228515625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 7.0, 4.0, 6.0, 9.0, 8.0, 15.0, 12.0, 12.0, 15.0, 18.0, 22.0, 19.0, 30.0, 35.0, 30.0, 33.0, 45.0, 37.0, 44.0, 37.0, 35.0, 47.0, 44.0, 39.0, 46.0, 38.0, 36.0, 29.0, 43.0, 25.0, 23.0, 22.0, 18.0, 10.0, 20.0, 9.0, 12.0, 19.0, 5.0, 11.0, 4.0, 6.0, 5.0, 5.0, 3.0, 7.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.775390625, -0.7483978271484375, -0.721405029296875, -0.6944122314453125, -0.66741943359375, -0.6404266357421875, -0.613433837890625, -0.5864410400390625, -0.5594482421875, -0.5324554443359375, -0.505462646484375, -0.4784698486328125, -0.45147705078125, -0.4244842529296875, -0.397491455078125, -0.3704986572265625, -0.343505859375, -0.3165130615234375, -0.289520263671875, -0.2625274658203125, -0.23553466796875, -0.2085418701171875, -0.181549072265625, -0.1545562744140625, -0.1275634765625, -0.1005706787109375, -0.073577880859375, -0.0465850830078125, -0.01959228515625, 0.0074005126953125, 0.034393310546875, 0.0613861083984375, 0.08837890625, 0.1153717041015625, 0.142364501953125, 0.1693572998046875, 0.19635009765625, 0.2233428955078125, 0.250335693359375, 0.2773284912109375, 0.3043212890625, 0.3313140869140625, 0.358306884765625, 0.3852996826171875, 0.41229248046875, 0.4392852783203125, 0.466278076171875, 0.4932708740234375, 0.520263671875, 0.5472564697265625, 0.574249267578125, 0.6012420654296875, 0.62823486328125, 0.6552276611328125, 0.682220458984375, 0.7092132568359375, 0.7362060546875, 0.7631988525390625, 0.790191650390625, 0.8171844482421875, 0.84417724609375, 0.8711700439453125, 0.898162841796875, 0.9251556396484375, 0.9521484375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 2.0, 9.0, 5.0, 12.0, 9.0, 19.0, 28.0, 38.0, 57.0, 77.0, 107.0, 163.0, 270.0, 415.0, 765.0, 1464.0, 3052.0, 8798.0, 40557.0, 352553.0, 574170.0, 49101.0, 9931.0, 3376.0, 1510.0, 757.0, 467.0, 259.0, 171.0, 141.0, 76.0, 45.0, 33.0, 35.0, 18.0, 13.0, 17.0, 14.0, 6.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-4.6328125, -4.500640869140625, -4.36846923828125, -4.236297607421875, -4.1041259765625, -3.971954345703125, -3.83978271484375, -3.707611083984375, -3.575439453125, -3.443267822265625, -3.31109619140625, -3.178924560546875, -3.0467529296875, -2.914581298828125, -2.78240966796875, -2.650238037109375, -2.51806640625, -2.385894775390625, -2.25372314453125, -2.121551513671875, -1.9893798828125, -1.857208251953125, -1.72503662109375, -1.592864990234375, -1.460693359375, -1.328521728515625, -1.19635009765625, -1.064178466796875, -0.9320068359375, -0.799835205078125, -0.66766357421875, -0.535491943359375, -0.4033203125, -0.271148681640625, -0.13897705078125, -0.006805419921875, 0.1253662109375, 0.257537841796875, 0.38970947265625, 0.521881103515625, 0.654052734375, 0.786224365234375, 0.91839599609375, 1.050567626953125, 1.1827392578125, 1.314910888671875, 1.44708251953125, 1.579254150390625, 1.71142578125, 1.843597412109375, 1.97576904296875, 2.107940673828125, 2.2401123046875, 2.372283935546875, 2.50445556640625, 2.636627197265625, 2.768798828125, 2.900970458984375, 3.03314208984375, 3.165313720703125, 3.2974853515625, 3.429656982421875, 3.56182861328125, 3.694000244140625, 3.826171875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 4.0, 1.0, 3.0, 1.0, 3.0, 4.0, 7.0, 9.0, 16.0, 17.0, 19.0, 40.0, 31.0, 49.0, 52.0, 65.0, 80.0, 63.0, 62.0, 55.0, 72.0, 67.0, 46.0, 56.0, 47.0, 34.0, 20.0, 25.0, 16.0, 12.0, 11.0, 9.0, 5.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.75390625, -3.58203125, -3.41015625, -3.23828125, -3.06640625, -2.89453125, -2.72265625, -2.55078125, -2.37890625, -2.20703125, -2.03515625, -1.86328125, -1.69140625, -1.51953125, -1.34765625, -1.17578125, -1.00390625, -0.83203125, -0.66015625, -0.48828125, -0.31640625, -0.14453125, 0.02734375, 0.19921875, 0.37109375, 0.54296875, 0.71484375, 0.88671875, 1.05859375, 1.23046875, 1.40234375, 1.57421875, 1.74609375, 1.91796875, 2.08984375, 2.26171875, 2.43359375, 2.60546875, 2.77734375, 2.94921875, 3.12109375, 3.29296875, 3.46484375, 3.63671875, 3.80859375, 3.98046875, 4.15234375, 4.32421875, 4.49609375, 4.66796875, 4.83984375, 5.01171875, 5.18359375, 5.35546875, 5.52734375, 5.69921875, 5.87109375, 6.04296875, 6.21484375, 6.38671875, 6.55859375, 6.73046875, 6.90234375, 7.07421875, 7.24609375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 4.0, 2.0, 0.0, 6.0, 7.0, 10.0, 11.0, 17.0, 17.0, 38.0, 58.0, 72.0, 117.0, 204.0, 430.0, 928.0, 2449.0, 9781.0, 73085.0, 785000.0, 154532.0, 15834.0, 3560.0, 1225.0, 464.0, 289.0, 133.0, 85.0, 67.0, 39.0, 23.0, 16.0, 16.0, 3.0, 7.0, 3.0, 5.0, 5.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-1.423828125, -1.3788299560546875, -1.333831787109375, -1.2888336181640625, -1.24383544921875, -1.1988372802734375, -1.153839111328125, -1.1088409423828125, -1.0638427734375, -1.0188446044921875, -0.973846435546875, -0.9288482666015625, -0.88385009765625, -0.8388519287109375, -0.793853759765625, -0.7488555908203125, -0.703857421875, -0.6588592529296875, -0.613861083984375, -0.5688629150390625, -0.52386474609375, -0.4788665771484375, -0.433868408203125, -0.3888702392578125, -0.3438720703125, -0.2988739013671875, -0.253875732421875, -0.2088775634765625, -0.16387939453125, -0.1188812255859375, -0.073883056640625, -0.0288848876953125, 0.01611328125, 0.0611114501953125, 0.106109619140625, 0.1511077880859375, 0.19610595703125, 0.2411041259765625, 0.286102294921875, 0.3311004638671875, 0.3760986328125, 0.4210968017578125, 0.466094970703125, 0.5110931396484375, 0.55609130859375, 0.6010894775390625, 0.646087646484375, 0.6910858154296875, 0.736083984375, 0.7810821533203125, 0.826080322265625, 0.8710784912109375, 0.91607666015625, 0.9610748291015625, 1.006072998046875, 1.0510711669921875, 1.0960693359375, 1.1410675048828125, 1.186065673828125, 1.2310638427734375, 1.27606201171875, 1.3210601806640625, 1.366058349609375, 1.4110565185546875, 1.4560546875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 2.0, 5.0, 4.0, 8.0, 13.0, 16.0, 10.0, 18.0, 18.0, 38.0, 29.0, 54.0, 49.0, 72.0, 94.0, 98.0, 110.0, 82.0, 65.0, 45.0, 44.0, 30.0, 22.0, 14.0, 9.0, 11.0, 3.0, 12.0, 6.0, 2.0, 3.0, 5.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002732276916503906, -0.0002643391489982605, -0.00025545060634613037, -0.00024656206369400024, -0.00023767352104187012, -0.00022878497838974, -0.00021989643573760986, -0.00021100789308547974, -0.0002021193504333496, -0.00019323080778121948, -0.00018434226512908936, -0.00017545372247695923, -0.0001665651798248291, -0.00015767663717269897, -0.00014878809452056885, -0.00013989955186843872, -0.0001310110092163086, -0.00012212246656417847, -0.00011323392391204834, -0.00010434538125991821, -9.545683860778809e-05, -8.656829595565796e-05, -7.767975330352783e-05, -6.87912106513977e-05, -5.990266799926758e-05, -5.101412534713745e-05, -4.2125582695007324e-05, -3.32370400428772e-05, -2.434849739074707e-05, -1.5459954738616943e-05, -6.571412086486816e-06, 2.3171305656433105e-06, 1.1205673217773438e-05, 2.0094215869903564e-05, 2.898275852203369e-05, 3.787130117416382e-05, 4.6759843826293945e-05, 5.564838647842407e-05, 6.45369291305542e-05, 7.342547178268433e-05, 8.231401443481445e-05, 9.120255708694458e-05, 0.00010009109973907471, 0.00010897964239120483, 0.00011786818504333496, 0.0001267567276954651, 0.00013564527034759521, 0.00014453381299972534, 0.00015342235565185547, 0.0001623108983039856, 0.00017119944095611572, 0.00018008798360824585, 0.00018897652626037598, 0.0001978650689125061, 0.00020675361156463623, 0.00021564215421676636, 0.00022453069686889648, 0.0002334192395210266, 0.00024230778217315674, 0.00025119632482528687, 0.000260084867477417, 0.0002689734101295471, 0.00027786195278167725, 0.0002867504954338074, 0.0002956390380859375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 1.0, 7.0, 5.0, 11.0, 8.0, 18.0, 17.0, 36.0, 38.0, 78.0, 154.0, 274.0, 566.0, 1312.0, 3571.0, 16881.0, 219435.0, 750982.0, 45001.0, 6542.0, 1949.0, 831.0, 357.0, 212.0, 116.0, 48.0, 34.0, 24.0, 21.0, 9.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.576171875, -1.5314178466796875, -1.486663818359375, -1.4419097900390625, -1.39715576171875, -1.3524017333984375, -1.307647705078125, -1.2628936767578125, -1.2181396484375, -1.1733856201171875, -1.128631591796875, -1.0838775634765625, -1.03912353515625, -0.9943695068359375, -0.949615478515625, -0.9048614501953125, -0.860107421875, -0.8153533935546875, -0.770599365234375, -0.7258453369140625, -0.68109130859375, -0.6363372802734375, -0.591583251953125, -0.5468292236328125, -0.5020751953125, -0.4573211669921875, -0.412567138671875, -0.3678131103515625, -0.32305908203125, -0.2783050537109375, -0.233551025390625, -0.1887969970703125, -0.14404296875, -0.0992889404296875, -0.054534912109375, -0.0097808837890625, 0.03497314453125, 0.0797271728515625, 0.124481201171875, 0.1692352294921875, 0.2139892578125, 0.2587432861328125, 0.303497314453125, 0.3482513427734375, 0.39300537109375, 0.4377593994140625, 0.482513427734375, 0.5272674560546875, 0.572021484375, 0.6167755126953125, 0.661529541015625, 0.7062835693359375, 0.75103759765625, 0.7957916259765625, 0.840545654296875, 0.8852996826171875, 0.9300537109375, 0.9748077392578125, 1.019561767578125, 1.0643157958984375, 1.10906982421875, 1.1538238525390625, 1.198577880859375, 1.2433319091796875, 1.2880859375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 8.0, 8.0, 15.0, 17.0, 25.0, 42.0, 51.0, 72.0, 93.0, 104.0, 121.0, 110.0, 104.0, 80.0, 52.0, 27.0, 27.0, 25.0, 15.0, 3.0, 7.0, 0.0, 3.0, 1.0, 2.0], "bins": [-2.451171875, -2.401702880859375, -2.35223388671875, -2.302764892578125, -2.2532958984375, -2.203826904296875, -2.15435791015625, -2.104888916015625, -2.055419921875, -2.005950927734375, -1.95648193359375, -1.907012939453125, -1.8575439453125, -1.808074951171875, -1.75860595703125, -1.709136962890625, -1.65966796875, -1.610198974609375, -1.56072998046875, -1.511260986328125, -1.4617919921875, -1.412322998046875, -1.36285400390625, -1.313385009765625, -1.263916015625, -1.214447021484375, -1.16497802734375, -1.115509033203125, -1.0660400390625, -1.016571044921875, -0.96710205078125, -0.917633056640625, -0.8681640625, -0.818695068359375, -0.76922607421875, -0.719757080078125, -0.6702880859375, -0.620819091796875, -0.57135009765625, -0.521881103515625, -0.472412109375, -0.422943115234375, -0.37347412109375, -0.324005126953125, -0.2745361328125, -0.225067138671875, -0.17559814453125, -0.126129150390625, -0.07666015625, -0.027191162109375, 0.02227783203125, 0.071746826171875, 0.1212158203125, 0.170684814453125, 0.22015380859375, 0.269622802734375, 0.319091796875, 0.368560791015625, 0.41802978515625, 0.467498779296875, 0.5169677734375, 0.566436767578125, 0.61590576171875, 0.665374755859375, 0.71484375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 10.0, 8.0, 8.0, 8.0, 13.0, 30.0, 52.0, 117.0, 189.0, 276.0, 125.0, 77.0, 41.0, 20.0, 11.0, 7.0, 2.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.426483154296875, -24.557722091674805, -23.688961029052734, -22.820199966430664, -21.951438903808594, -21.08267593383789, -20.21391487121582, -19.34515380859375, -18.47639274597168, -17.60763168334961, -16.73887062072754, -15.870108604431152, -15.001347541809082, -14.132586479187012, -13.263824462890625, -12.395063400268555, -11.526302337646484, -10.657541275024414, -9.788780212402344, -8.920018196105957, -8.051257133483887, -7.182496070861816, -6.313734531402588, -5.444972991943359, -4.576211929321289, -3.7074506282806396, -2.8386893272399902, -1.9699280261993408, -1.1011667251586914, -0.2324056625366211, 0.6363558769226074, 1.505117416381836, 2.373880386352539, 3.2426416873931885, 4.111402988433838, 4.980164527893066, 5.848925590515137, 6.717686653137207, 7.5864481925964355, 8.455209732055664, 9.323970794677734, 10.192731857299805, 11.061492919921875, 11.930254936218262, 12.799015998840332, 13.667777061462402, 14.536539077758789, 15.40530014038086, 16.27406120300293, 17.142822265625, 18.01158332824707, 18.88034439086914, 19.749107360839844, 20.61786651611328, 21.486629486083984, 22.355390548706055, 23.224151611328125, 24.092912673950195, 24.961673736572266, 25.830434799194336, 26.699195861816406, 27.56795883178711, 28.43671989440918, 29.30548095703125, 30.17424201965332]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 4.0, 4.0, 6.0, 9.0, 5.0, 10.0, 12.0, 8.0, 14.0, 18.0, 11.0, 21.0, 20.0, 25.0, 27.0, 25.0, 22.0, 32.0, 42.0, 45.0, 63.0, 66.0, 67.0, 58.0, 61.0, 43.0, 39.0, 33.0, 31.0, 22.0, 22.0, 18.0, 16.0, 12.0, 18.0, 6.0, 13.0, 16.0, 10.0, 6.0, 6.0, 4.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.952184677124023, -13.482481956481934, -13.01278018951416, -12.54307746887207, -12.073375701904297, -11.603672981262207, -11.133970260620117, -10.664268493652344, -10.19456672668457, -9.72486400604248, -9.255162239074707, -8.785459518432617, -8.315757751464844, -7.846055030822754, -7.376352787017822, -6.906650543212891, -6.436947822570801, -5.967245578765869, -5.4975433349609375, -5.027840614318848, -4.558138847351074, -4.088436126708984, -3.6187338829040527, -3.149031639099121, -2.6793293952941895, -2.209627151489258, -1.7399247884750366, -1.2702224254608154, -0.8005201816558838, -0.33081793785095215, 0.1388845443725586, 0.6085867881774902, 1.0782890319824219, 1.5479912757873535, 2.017693519592285, 2.487396001815796, 2.9570982456207275, 3.426800489425659, 3.89650297164917, 4.366205215454102, 4.835907459259033, 5.305609703063965, 5.7753119468688965, 6.245014190673828, 6.714716911315918, 7.184418678283691, 7.654121398925781, 8.123823165893555, 8.593525886535645, 9.063228607177734, 9.532930374145508, 10.002633094787598, 10.472334861755371, 10.942037582397461, 11.411739349365234, 11.881442070007324, 12.351144790649414, 12.820847511291504, 13.290549278259277, 13.760251998901367, 14.22995376586914, 14.69965648651123, 15.16935920715332, 15.639060974121094, 16.108762741088867]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 7.0, 5.0, 7.0, 11.0, 10.0, 17.0, 26.0, 42.0, 43.0, 100.0, 99.0, 143.0, 255.0, 355.0, 617.0, 1229.0, 2360.0, 4830.0, 11125.0, 32768.0, 185089.0, 2107797.0, 1657682.0, 142503.0, 27958.0, 9977.0, 4261.0, 2161.0, 1069.0, 632.0, 383.0, 225.0, 163.0, 85.0, 77.0, 50.0, 33.0, 27.0, 11.0, 6.0, 10.0, 8.0, 6.0, 4.0, 10.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.34765625, -1.304107666015625, -1.26055908203125, -1.217010498046875, -1.1734619140625, -1.129913330078125, -1.08636474609375, -1.042816162109375, -0.999267578125, -0.955718994140625, -0.91217041015625, -0.868621826171875, -0.8250732421875, -0.781524658203125, -0.73797607421875, -0.694427490234375, -0.65087890625, -0.607330322265625, -0.56378173828125, -0.520233154296875, -0.4766845703125, -0.433135986328125, -0.38958740234375, -0.346038818359375, -0.302490234375, -0.258941650390625, -0.21539306640625, -0.171844482421875, -0.1282958984375, -0.084747314453125, -0.04119873046875, 0.002349853515625, 0.0458984375, 0.089447021484375, 0.13299560546875, 0.176544189453125, 0.2200927734375, 0.263641357421875, 0.30718994140625, 0.350738525390625, 0.394287109375, 0.437835693359375, 0.48138427734375, 0.524932861328125, 0.5684814453125, 0.612030029296875, 0.65557861328125, 0.699127197265625, 0.74267578125, 0.786224365234375, 0.82977294921875, 0.873321533203125, 0.9168701171875, 0.960418701171875, 1.00396728515625, 1.047515869140625, 1.091064453125, 1.134613037109375, 1.17816162109375, 1.221710205078125, 1.2652587890625, 1.308807373046875, 1.35235595703125, 1.395904541015625, 1.439453125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 0.0, 1.0, 2.0, 10.0, 6.0, 5.0, 14.0, 12.0, 12.0, 18.0, 28.0, 23.0, 28.0, 30.0, 33.0, 41.0, 38.0, 47.0, 38.0, 31.0, 41.0, 38.0, 41.0, 43.0, 50.0, 40.0, 39.0, 37.0, 31.0, 26.0, 37.0, 19.0, 26.0, 15.0, 19.0, 10.0, 15.0, 15.0, 10.0, 9.0, 7.0, 2.0, 7.0, 3.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.8642578125, -0.8381881713867188, -0.8121185302734375, -0.7860488891601562, -0.759979248046875, -0.7339096069335938, -0.7078399658203125, -0.6817703247070312, -0.65570068359375, -0.6296310424804688, -0.6035614013671875, -0.5774917602539062, -0.551422119140625, -0.5253524780273438, -0.4992828369140625, -0.47321319580078125, -0.4471435546875, -0.42107391357421875, -0.3950042724609375, -0.36893463134765625, -0.342864990234375, -0.31679534912109375, -0.2907257080078125, -0.26465606689453125, -0.23858642578125, -0.21251678466796875, -0.1864471435546875, -0.16037750244140625, -0.134307861328125, -0.10823822021484375, -0.0821685791015625, -0.05609893798828125, -0.030029296875, -0.00395965576171875, 0.0221099853515625, 0.04817962646484375, 0.074249267578125, 0.10031890869140625, 0.1263885498046875, 0.15245819091796875, 0.17852783203125, 0.20459747314453125, 0.2306671142578125, 0.25673675537109375, 0.282806396484375, 0.30887603759765625, 0.3349456787109375, 0.36101531982421875, 0.3870849609375, 0.41315460205078125, 0.4392242431640625, 0.46529388427734375, 0.491363525390625, 0.5174331665039062, 0.5435028076171875, 0.5695724487304688, 0.59564208984375, 0.6217117309570312, 0.6477813720703125, 0.6738510131835938, 0.699920654296875, 0.7259902954101562, 0.7520599365234375, 0.7781295776367188, 0.80419921875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 5.0, 15.0, 13.0, 21.0, 32.0, 58.0, 116.0, 220.0, 499.0, 1294.0, 4324.0, 20560.0, 244331.0, 3795917.0, 107968.0, 13534.0, 3279.0, 1156.0, 463.0, 224.0, 101.0, 61.0, 39.0, 18.0, 15.0, 7.0, 6.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-3.958984375, -3.858428955078125, -3.75787353515625, -3.657318115234375, -3.5567626953125, -3.456207275390625, -3.35565185546875, -3.255096435546875, -3.154541015625, -3.053985595703125, -2.95343017578125, -2.852874755859375, -2.7523193359375, -2.651763916015625, -2.55120849609375, -2.450653076171875, -2.35009765625, -2.249542236328125, -2.14898681640625, -2.048431396484375, -1.9478759765625, -1.847320556640625, -1.74676513671875, -1.646209716796875, -1.545654296875, -1.445098876953125, -1.34454345703125, -1.243988037109375, -1.1434326171875, -1.042877197265625, -0.94232177734375, -0.841766357421875, -0.7412109375, -0.640655517578125, -0.54010009765625, -0.439544677734375, -0.3389892578125, -0.238433837890625, -0.13787841796875, -0.037322998046875, 0.063232421875, 0.163787841796875, 0.26434326171875, 0.364898681640625, 0.4654541015625, 0.566009521484375, 0.66656494140625, 0.767120361328125, 0.86767578125, 0.968231201171875, 1.06878662109375, 1.169342041015625, 1.2698974609375, 1.370452880859375, 1.47100830078125, 1.571563720703125, 1.672119140625, 1.772674560546875, 1.87322998046875, 1.973785400390625, 2.0743408203125, 2.174896240234375, 2.27545166015625, 2.376007080078125, 2.4765625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 7.0, 4.0, 5.0, 9.0, 16.0, 12.0, 22.0, 36.0, 55.0, 90.0, 132.0, 323.0, 692.0, 1145.0, 792.0, 309.0, 153.0, 94.0, 57.0, 30.0, 24.0, 20.0, 15.0, 9.0, 10.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.76171875, -2.676788330078125, -2.59185791015625, -2.506927490234375, -2.4219970703125, -2.337066650390625, -2.25213623046875, -2.167205810546875, -2.082275390625, -1.997344970703125, -1.91241455078125, -1.827484130859375, -1.7425537109375, -1.657623291015625, -1.57269287109375, -1.487762451171875, -1.40283203125, -1.317901611328125, -1.23297119140625, -1.148040771484375, -1.0631103515625, -0.978179931640625, -0.89324951171875, -0.808319091796875, -0.723388671875, -0.638458251953125, -0.55352783203125, -0.468597412109375, -0.3836669921875, -0.298736572265625, -0.21380615234375, -0.128875732421875, -0.0439453125, 0.040985107421875, 0.12591552734375, 0.210845947265625, 0.2957763671875, 0.380706787109375, 0.46563720703125, 0.550567626953125, 0.635498046875, 0.720428466796875, 0.80535888671875, 0.890289306640625, 0.9752197265625, 1.060150146484375, 1.14508056640625, 1.230010986328125, 1.31494140625, 1.399871826171875, 1.48480224609375, 1.569732666015625, 1.6546630859375, 1.739593505859375, 1.82452392578125, 1.909454345703125, 1.994384765625, 2.079315185546875, 2.16424560546875, 2.249176025390625, 2.3341064453125, 2.419036865234375, 2.50396728515625, 2.588897705078125, 2.673828125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 5.0, 20.0, 46.0, 215.0, 394.0, 224.0, 52.0, 12.0, 13.0, 6.0, 5.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.07345962524414, -15.891817092895508, -14.710174560546875, -13.528532028198242, -12.34688949584961, -11.165246963500977, -9.983604431152344, -8.801961898803711, -7.620319366455078, -6.438676834106445, -5.2570343017578125, -4.07539176940918, -2.893749237060547, -1.712106704711914, -0.5304641723632812, 0.6511783599853516, 1.8328208923339844, 3.014463424682617, 4.19610595703125, 5.377748489379883, 6.559391021728516, 7.741033554077148, 8.922676086425781, 10.104318618774414, 11.285961151123047, 12.46760368347168, 13.649246215820312, 14.830888748168945, 16.012531280517578, 17.19417381286621, 18.375816345214844, 19.557458877563477, 20.739105224609375, 21.920747756958008, 23.10239028930664, 24.284032821655273, 25.465675354003906, 26.64731788635254, 27.828960418701172, 29.010602951049805, 30.192245483398438, 31.37388801574707, 32.5555305480957, 33.73717498779297, 34.91881561279297, 36.10045623779297, 37.282100677490234, 38.4637451171875, 39.6453857421875, 40.8270263671875, 42.008670806884766, 43.19031524658203, 44.37195587158203, 45.55359649658203, 46.7352409362793, 47.91688537597656, 49.09852600097656, 50.28016662597656, 51.46181106567383, 52.643455505371094, 53.825096130371094, 55.006736755371094, 56.18838119506836, 57.370025634765625, 58.551666259765625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 3.0, 3.0, 3.0, 8.0, 9.0, 10.0, 20.0, 26.0, 23.0, 25.0, 36.0, 31.0, 55.0, 57.0, 65.0, 74.0, 45.0, 56.0, 61.0, 60.0, 66.0, 44.0, 39.0, 42.0, 31.0, 23.0, 32.0, 18.0, 15.0, 14.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.715545654296875, -11.338780403137207, -10.962014198303223, -10.585248947143555, -10.20848274230957, -9.831717491149902, -9.454952239990234, -9.07818603515625, -8.701420783996582, -8.324655532836914, -7.94788932800293, -7.571124076843262, -7.1943583488464355, -6.817592620849609, -6.440827369689941, -6.064061641693115, -5.687295913696289, -5.310530185699463, -4.933764457702637, -4.556999206542969, -4.180233478546143, -3.8034677505493164, -3.4267022609710693, -3.0499367713928223, -2.673171043395996, -2.29640531539917, -1.9196398258209229, -1.5428742170333862, -1.1661086082458496, -0.789342999458313, -0.41257739067077637, -0.0358119010925293, 0.3409538269042969, 0.7177194356918335, 1.0944850444793701, 1.4712506532669067, 1.8480162620544434, 2.2247819900512695, 2.6015474796295166, 2.9783129692077637, 3.35507869720459, 3.731844425201416, 4.108610153198242, 4.48537540435791, 4.862141132354736, 5.2389068603515625, 5.6156721115112305, 5.992437839508057, 6.369203567504883, 6.745969295501709, 7.122735023498535, 7.499500274658203, 7.876266002655029, 8.253031730651855, 8.629796981811523, 9.006563186645508, 9.383328437805176, 9.760093688964844, 10.136859893798828, 10.513625144958496, 10.890390396118164, 11.267156600952148, 11.643921852111816, 12.020687103271484, 12.397453308105469]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 9.0, 7.0, 24.0, 26.0, 48.0, 65.0, 99.0, 144.0, 238.0, 361.0, 585.0, 994.0, 1726.0, 3041.0, 6079.0, 12941.0, 30511.0, 74703.0, 184718.0, 343298.0, 226165.0, 93869.0, 37533.0, 15621.0, 7269.0, 3674.0, 1977.0, 1103.0, 619.0, 417.0, 256.0, 158.0, 97.0, 55.0, 51.0, 26.0, 11.0, 11.0, 9.0, 7.0, 7.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4287109375, -1.376983642578125, -1.32525634765625, -1.273529052734375, -1.2218017578125, -1.170074462890625, -1.11834716796875, -1.066619873046875, -1.014892578125, -0.963165283203125, -0.91143798828125, -0.859710693359375, -0.8079833984375, -0.756256103515625, -0.70452880859375, -0.652801513671875, -0.60107421875, -0.549346923828125, -0.49761962890625, -0.445892333984375, -0.3941650390625, -0.342437744140625, -0.29071044921875, -0.238983154296875, -0.187255859375, -0.135528564453125, -0.08380126953125, -0.032073974609375, 0.0196533203125, 0.071380615234375, 0.12310791015625, 0.174835205078125, 0.2265625, 0.278289794921875, 0.33001708984375, 0.381744384765625, 0.4334716796875, 0.485198974609375, 0.53692626953125, 0.588653564453125, 0.640380859375, 0.692108154296875, 0.74383544921875, 0.795562744140625, 0.8472900390625, 0.899017333984375, 0.95074462890625, 1.002471923828125, 1.05419921875, 1.105926513671875, 1.15765380859375, 1.209381103515625, 1.2611083984375, 1.312835693359375, 1.36456298828125, 1.416290283203125, 1.468017578125, 1.519744873046875, 1.57147216796875, 1.623199462890625, 1.6749267578125, 1.726654052734375, 1.77838134765625, 1.830108642578125, 1.8818359375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 13.0, 11.0, 6.0, 11.0, 20.0, 16.0, 21.0, 29.0, 38.0, 26.0, 33.0, 33.0, 42.0, 31.0, 42.0, 33.0, 38.0, 40.0, 40.0, 41.0, 44.0, 56.0, 37.0, 40.0, 23.0, 22.0, 19.0, 27.0, 27.0, 20.0, 15.0, 19.0, 18.0, 5.0, 16.0, 5.0, 9.0, 10.0, 4.0, 3.0, 5.0, 3.0, 1.0, 6.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.85009765625, -0.82452392578125, -0.7989501953125, -0.77337646484375, -0.747802734375, -0.72222900390625, -0.6966552734375, -0.67108154296875, -0.6455078125, -0.61993408203125, -0.5943603515625, -0.56878662109375, -0.543212890625, -0.51763916015625, -0.4920654296875, -0.46649169921875, -0.44091796875, -0.41534423828125, -0.3897705078125, -0.36419677734375, -0.338623046875, -0.31304931640625, -0.2874755859375, -0.26190185546875, -0.236328125, -0.21075439453125, -0.1851806640625, -0.15960693359375, -0.134033203125, -0.10845947265625, -0.0828857421875, -0.05731201171875, -0.03173828125, -0.00616455078125, 0.0194091796875, 0.04498291015625, 0.070556640625, 0.09613037109375, 0.1217041015625, 0.14727783203125, 0.1728515625, 0.19842529296875, 0.2239990234375, 0.24957275390625, 0.275146484375, 0.30072021484375, 0.3262939453125, 0.35186767578125, 0.37744140625, 0.40301513671875, 0.4285888671875, 0.45416259765625, 0.479736328125, 0.50531005859375, 0.5308837890625, 0.55645751953125, 0.58203125, 0.60760498046875, 0.6331787109375, 0.65875244140625, 0.684326171875, 0.70989990234375, 0.7354736328125, 0.76104736328125, 0.78662109375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 5.0, 8.0, 10.0, 11.0, 18.0, 29.0, 21.0, 28.0, 32.0, 79.0, 109.0, 199.0, 313.0, 610.0, 1442.0, 3994.0, 14153.0, 65017.0, 446367.0, 430308.0, 64650.0, 14088.0, 4072.0, 1492.0, 602.0, 310.0, 174.0, 120.0, 69.0, 53.0, 41.0, 40.0, 26.0, 19.0, 14.0, 10.0, 4.0, 5.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.396484375, -2.3138427734375, -2.231201171875, -2.1485595703125, -2.06591796875, -1.9832763671875, -1.900634765625, -1.8179931640625, -1.7353515625, -1.6527099609375, -1.570068359375, -1.4874267578125, -1.40478515625, -1.3221435546875, -1.239501953125, -1.1568603515625, -1.07421875, -0.9915771484375, -0.908935546875, -0.8262939453125, -0.74365234375, -0.6610107421875, -0.578369140625, -0.4957275390625, -0.4130859375, -0.3304443359375, -0.247802734375, -0.1651611328125, -0.08251953125, 0.0001220703125, 0.082763671875, 0.1654052734375, 0.248046875, 0.3306884765625, 0.413330078125, 0.4959716796875, 0.57861328125, 0.6612548828125, 0.743896484375, 0.8265380859375, 0.9091796875, 0.9918212890625, 1.074462890625, 1.1571044921875, 1.23974609375, 1.3223876953125, 1.405029296875, 1.4876708984375, 1.5703125, 1.6529541015625, 1.735595703125, 1.8182373046875, 1.90087890625, 1.9835205078125, 2.066162109375, 2.1488037109375, 2.2314453125, 2.3140869140625, 2.396728515625, 2.4793701171875, 2.56201171875, 2.6446533203125, 2.727294921875, 2.8099365234375, 2.892578125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 3.0, 4.0, 4.0, 9.0, 10.0, 12.0, 15.0, 16.0, 22.0, 22.0, 26.0, 42.0, 35.0, 37.0, 48.0, 47.0, 53.0, 57.0, 51.0, 62.0, 50.0, 43.0, 50.0, 50.0, 43.0, 29.0, 38.0, 19.0, 21.0, 20.0, 15.0, 15.0, 11.0, 5.0, 11.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.328125, -3.224029541015625, -3.11993408203125, -3.015838623046875, -2.9117431640625, -2.807647705078125, -2.70355224609375, -2.599456787109375, -2.495361328125, -2.391265869140625, -2.28717041015625, -2.183074951171875, -2.0789794921875, -1.974884033203125, -1.87078857421875, -1.766693115234375, -1.66259765625, -1.558502197265625, -1.45440673828125, -1.350311279296875, -1.2462158203125, -1.142120361328125, -1.03802490234375, -0.933929443359375, -0.829833984375, -0.725738525390625, -0.62164306640625, -0.517547607421875, -0.4134521484375, -0.309356689453125, -0.20526123046875, -0.101165771484375, 0.0029296875, 0.107025146484375, 0.21112060546875, 0.315216064453125, 0.4193115234375, 0.523406982421875, 0.62750244140625, 0.731597900390625, 0.835693359375, 0.939788818359375, 1.04388427734375, 1.147979736328125, 1.2520751953125, 1.356170654296875, 1.46026611328125, 1.564361572265625, 1.66845703125, 1.772552490234375, 1.87664794921875, 1.980743408203125, 2.0848388671875, 2.188934326171875, 2.29302978515625, 2.397125244140625, 2.501220703125, 2.605316162109375, 2.70941162109375, 2.813507080078125, 2.9176025390625, 3.021697998046875, 3.12579345703125, 3.229888916015625, 3.333984375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 6.0, 5.0, 22.0, 18.0, 24.0, 48.0, 82.0, 164.0, 294.0, 660.0, 1821.0, 5890.0, 27403.0, 182467.0, 702981.0, 103218.0, 16943.0, 4056.0, 1351.0, 505.0, 258.0, 147.0, 71.0, 43.0, 20.0, 18.0, 10.0, 11.0, 5.0, 8.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79638671875, -0.7683029174804688, -0.7402191162109375, -0.7121353149414062, -0.684051513671875, -0.6559677124023438, -0.6278839111328125, -0.5998001098632812, -0.57171630859375, -0.5436325073242188, -0.5155487060546875, -0.48746490478515625, -0.459381103515625, -0.43129730224609375, -0.4032135009765625, -0.37512969970703125, -0.3470458984375, -0.31896209716796875, -0.2908782958984375, -0.26279449462890625, -0.234710693359375, -0.20662689208984375, -0.1785430908203125, -0.15045928955078125, -0.12237548828125, -0.09429168701171875, -0.0662078857421875, -0.03812408447265625, -0.010040283203125, 0.01804351806640625, 0.0461273193359375, 0.07421112060546875, 0.102294921875, 0.13037872314453125, 0.1584625244140625, 0.18654632568359375, 0.214630126953125, 0.24271392822265625, 0.2707977294921875, 0.29888153076171875, 0.32696533203125, 0.35504913330078125, 0.3831329345703125, 0.41121673583984375, 0.439300537109375, 0.46738433837890625, 0.4954681396484375, 0.5235519409179688, 0.5516357421875, 0.5797195434570312, 0.6078033447265625, 0.6358871459960938, 0.663970947265625, 0.6920547485351562, 0.7201385498046875, 0.7482223510742188, 0.77630615234375, 0.8043899536132812, 0.8324737548828125, 0.8605575561523438, 0.888641357421875, 0.9167251586914062, 0.9448089599609375, 0.9728927612304688, 1.0009765625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 4.0, 5.0, 9.0, 8.0, 15.0, 19.0, 24.0, 38.0, 58.0, 80.0, 107.0, 132.0, 124.0, 119.0, 92.0, 49.0, 32.0, 21.0, 13.0, 15.0, 13.0, 7.0, 4.0, 2.0, 5.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00031828880310058594, -0.0003085993230342865, -0.00029890984296798706, -0.0002892203629016876, -0.0002795308828353882, -0.00026984140276908875, -0.0002601519227027893, -0.00025046244263648987, -0.00024077296257019043, -0.000231083482503891, -0.00022139400243759155, -0.00021170452237129211, -0.00020201504230499268, -0.00019232556223869324, -0.0001826360821723938, -0.00017294660210609436, -0.00016325712203979492, -0.00015356764197349548, -0.00014387816190719604, -0.0001341886818408966, -0.00012449920177459717, -0.00011480972170829773, -0.00010512024164199829, -9.543076157569885e-05, -8.574128150939941e-05, -7.605180144309998e-05, -6.636232137680054e-05, -5.66728413105011e-05, -4.698336124420166e-05, -3.729388117790222e-05, -2.7604401111602783e-05, -1.7914921045303345e-05, -8.225440979003906e-06, 1.4640390872955322e-06, 1.115351915359497e-05, 2.084299921989441e-05, 3.053247928619385e-05, 4.0221959352493286e-05, 4.9911439418792725e-05, 5.960091948509216e-05, 6.92903995513916e-05, 7.897987961769104e-05, 8.866935968399048e-05, 9.835883975028992e-05, 0.00010804831981658936, 0.0001177377998828888, 0.00012742727994918823, 0.00013711676001548767, 0.0001468062400817871, 0.00015649572014808655, 0.00016618520021438599, 0.00017587468028068542, 0.00018556416034698486, 0.0001952536404132843, 0.00020494312047958374, 0.00021463260054588318, 0.00022432208061218262, 0.00023401156067848206, 0.0002437010407447815, 0.00025339052081108093, 0.00026308000087738037, 0.0002727694809436798, 0.00028245896100997925, 0.0002921484410762787, 0.0003018379211425781]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 4.0, 16.0, 12.0, 19.0, 38.0, 55.0, 138.0, 316.0, 837.0, 2704.0, 12402.0, 95218.0, 759548.0, 153990.0, 17957.0, 3542.0, 1015.0, 394.0, 164.0, 72.0, 43.0, 28.0, 19.0, 4.0, 8.0, 4.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2880859375, -1.2538299560546875, -1.219573974609375, -1.1853179931640625, -1.15106201171875, -1.1168060302734375, -1.082550048828125, -1.0482940673828125, -1.0140380859375, -0.9797821044921875, -0.945526123046875, -0.9112701416015625, -0.87701416015625, -0.8427581787109375, -0.808502197265625, -0.7742462158203125, -0.739990234375, -0.7057342529296875, -0.671478271484375, -0.6372222900390625, -0.60296630859375, -0.5687103271484375, -0.534454345703125, -0.5001983642578125, -0.4659423828125, -0.4316864013671875, -0.397430419921875, -0.3631744384765625, -0.32891845703125, -0.2946624755859375, -0.260406494140625, -0.2261505126953125, -0.19189453125, -0.1576385498046875, -0.123382568359375, -0.0891265869140625, -0.05487060546875, -0.0206146240234375, 0.013641357421875, 0.0478973388671875, 0.0821533203125, 0.1164093017578125, 0.150665283203125, 0.1849212646484375, 0.21917724609375, 0.2534332275390625, 0.287689208984375, 0.3219451904296875, 0.356201171875, 0.3904571533203125, 0.424713134765625, 0.4589691162109375, 0.49322509765625, 0.5274810791015625, 0.561737060546875, 0.5959930419921875, 0.6302490234375, 0.6645050048828125, 0.698760986328125, 0.7330169677734375, 0.76727294921875, 0.8015289306640625, 0.835784912109375, 0.8700408935546875, 0.904296875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 4.0, 4.0, 5.0, 13.0, 15.0, 32.0, 20.0, 33.0, 49.0, 48.0, 62.0, 69.0, 82.0, 98.0, 89.0, 75.0, 63.0, 54.0, 46.0, 24.0, 33.0, 21.0, 21.0, 12.0, 8.0, 8.0, 3.0, 2.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8984375, -0.8707733154296875, -0.843109130859375, -0.8154449462890625, -0.78778076171875, -0.7601165771484375, -0.732452392578125, -0.7047882080078125, -0.6771240234375, -0.6494598388671875, -0.621795654296875, -0.5941314697265625, -0.56646728515625, -0.5388031005859375, -0.511138916015625, -0.4834747314453125, -0.455810546875, -0.4281463623046875, -0.400482177734375, -0.3728179931640625, -0.34515380859375, -0.3174896240234375, -0.289825439453125, -0.2621612548828125, -0.2344970703125, -0.2068328857421875, -0.179168701171875, -0.1515045166015625, -0.12384033203125, -0.0961761474609375, -0.068511962890625, -0.0408477783203125, -0.01318359375, 0.0144805908203125, 0.042144775390625, 0.0698089599609375, 0.09747314453125, 0.1251373291015625, 0.152801513671875, 0.1804656982421875, 0.2081298828125, 0.2357940673828125, 0.263458251953125, 0.2911224365234375, 0.31878662109375, 0.3464508056640625, 0.374114990234375, 0.4017791748046875, 0.429443359375, 0.4571075439453125, 0.484771728515625, 0.5124359130859375, 0.54010009765625, 0.5677642822265625, 0.595428466796875, 0.6230926513671875, 0.6507568359375, 0.6784210205078125, 0.706085205078125, 0.7337493896484375, 0.76141357421875, 0.7890777587890625, 0.816741943359375, 0.8444061279296875, 0.8720703125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 7.0, 16.0, 13.0, 36.0, 54.0, 79.0, 128.0, 217.0, 157.0, 93.0, 51.0, 54.0, 34.0, 18.0, 10.0, 5.0, 5.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.331497192382812, -12.849333763122559, -12.367170333862305, -11.885005950927734, -11.40284252166748, -10.920679092407227, -10.438515663146973, -9.956352233886719, -9.474187850952148, -8.992024421691895, -8.50986099243164, -8.02769660949707, -7.545533180236816, -7.0633697509765625, -6.581206321716309, -6.099042892456055, -5.616879463195801, -5.134716033935547, -4.652552127838135, -4.170388698577881, -3.688225030899048, -3.206061363220215, -2.723897933959961, -2.241734266281128, -1.759570598602295, -1.277406930923462, -0.7952433824539185, -0.313079833984375, 0.169083833694458, 0.651247501373291, 1.133410930633545, 1.615574598312378, 2.097738265991211, 2.579901933670044, 3.062065601348877, 3.544229030609131, 4.026392936706543, 4.508556365966797, 4.990719795227051, 5.472883224487305, 5.955047130584717, 6.437210559844971, 6.919374465942383, 7.401537895202637, 7.883701324462891, 8.365865707397461, 8.848028182983398, 9.330192565917969, 9.812355995178223, 10.294519424438477, 10.77668285369873, 11.258846282958984, 11.741010665893555, 12.223174095153809, 12.705337524414062, 13.187500953674316, 13.66966438293457, 14.151827812194824, 14.633991241455078, 15.116155624389648, 15.598319053649902, 16.080482482910156, 16.562644958496094, 17.044809341430664, 17.526973724365234]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 7.0, 2.0, 4.0, 4.0, 8.0, 7.0, 9.0, 8.0, 7.0, 12.0, 7.0, 14.0, 18.0, 26.0, 18.0, 27.0, 25.0, 27.0, 31.0, 39.0, 50.0, 46.0, 63.0, 76.0, 65.0, 54.0, 49.0, 29.0, 24.0, 22.0, 26.0, 25.0, 23.0, 22.0, 16.0, 24.0, 16.0, 13.0, 18.0, 5.0, 8.0, 6.0, 5.0, 7.0, 4.0, 5.0, 5.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.22567367553711, -9.891401290893555, -9.55712890625, -9.222856521606445, -8.88858413696289, -8.554311752319336, -8.220039367675781, -7.885766983032227, -7.551494598388672, -7.217222213745117, -6.8829498291015625, -6.548677444458008, -6.214405059814453, -5.880132675170898, -5.545860290527344, -5.211587905883789, -4.877315044403076, -4.5430426597595215, -4.208770275115967, -3.874497890472412, -3.5402255058288574, -3.2059531211853027, -2.871680498123169, -2.5374081134796143, -2.2031357288360596, -1.8688633441925049, -1.5345909595489502, -1.200318455696106, -0.8660460710525513, -0.5317736864089966, -0.19750118255615234, 0.13677120208740234, 0.47104358673095703, 0.8053159713745117, 1.1395883560180664, 1.4738608598709106, 1.8081332445144653, 2.1424055099487305, 2.4766781330108643, 2.810950517654419, 3.1452229022979736, 3.4794952869415283, 3.813767671585083, 4.148040294647217, 4.4823126792907715, 4.816585063934326, 5.150857448577881, 5.4851298332214355, 5.81940221786499, 6.153674602508545, 6.4879469871521, 6.822219371795654, 7.156491756439209, 7.490764141082764, 7.825037002563477, 8.159309387207031, 8.493581771850586, 8.82785415649414, 9.162126541137695, 9.49639892578125, 9.830671310424805, 10.16494369506836, 10.499216079711914, 10.833488464355469, 11.167760848999023]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 8.0, 6.0, 12.0, 21.0, 33.0, 40.0, 54.0, 72.0, 95.0, 135.0, 229.0, 314.0, 544.0, 942.0, 1663.0, 3237.0, 6765.0, 16306.0, 56966.0, 357909.0, 2612663.0, 973137.0, 117845.0, 25971.0, 9667.0, 4363.0, 2145.0, 1252.0, 722.0, 366.0, 259.0, 179.0, 87.0, 61.0, 54.0, 43.0, 33.0, 27.0, 16.0, 10.0, 12.0, 6.0, 5.0, 6.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.009765625, -0.9733428955078125, -0.936920166015625, -0.9004974365234375, -0.86407470703125, -0.8276519775390625, -0.791229248046875, -0.7548065185546875, -0.7183837890625, -0.6819610595703125, -0.645538330078125, -0.6091156005859375, -0.57269287109375, -0.5362701416015625, -0.499847412109375, -0.4634246826171875, -0.427001953125, -0.3905792236328125, -0.354156494140625, -0.3177337646484375, -0.28131103515625, -0.2448883056640625, -0.208465576171875, -0.1720428466796875, -0.1356201171875, -0.0991973876953125, -0.062774658203125, -0.0263519287109375, 0.01007080078125, 0.0464935302734375, 0.082916259765625, 0.1193389892578125, 0.15576171875, 0.1921844482421875, 0.228607177734375, 0.2650299072265625, 0.30145263671875, 0.3378753662109375, 0.374298095703125, 0.4107208251953125, 0.4471435546875, 0.4835662841796875, 0.519989013671875, 0.5564117431640625, 0.59283447265625, 0.6292572021484375, 0.665679931640625, 0.7021026611328125, 0.738525390625, 0.7749481201171875, 0.811370849609375, 0.8477935791015625, 0.88421630859375, 0.9206390380859375, 0.957061767578125, 0.9934844970703125, 1.0299072265625, 1.0663299560546875, 1.102752685546875, 1.1391754150390625, 1.17559814453125, 1.2120208740234375, 1.248443603515625, 1.2848663330078125, 1.3212890625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 6.0, 7.0, 9.0, 6.0, 5.0, 10.0, 10.0, 11.0, 12.0, 19.0, 20.0, 31.0, 26.0, 31.0, 36.0, 43.0, 34.0, 41.0, 32.0, 31.0, 33.0, 47.0, 35.0, 53.0, 49.0, 39.0, 49.0, 32.0, 32.0, 25.0, 30.0, 20.0, 22.0, 20.0, 17.0, 18.0, 14.0, 10.0, 8.0, 5.0, 3.0, 5.0, 8.0, 5.0, 3.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7724609375, -0.7482147216796875, -0.723968505859375, -0.6997222900390625, -0.67547607421875, -0.6512298583984375, -0.626983642578125, -0.6027374267578125, -0.5784912109375, -0.5542449951171875, -0.529998779296875, -0.5057525634765625, -0.48150634765625, -0.4572601318359375, -0.433013916015625, -0.4087677001953125, -0.384521484375, -0.3602752685546875, -0.336029052734375, -0.3117828369140625, -0.28753662109375, -0.2632904052734375, -0.239044189453125, -0.2147979736328125, -0.1905517578125, -0.1663055419921875, -0.142059326171875, -0.1178131103515625, -0.09356689453125, -0.0693206787109375, -0.045074462890625, -0.0208282470703125, 0.00341796875, 0.0276641845703125, 0.051910400390625, 0.0761566162109375, 0.10040283203125, 0.1246490478515625, 0.148895263671875, 0.1731414794921875, 0.1973876953125, 0.2216339111328125, 0.245880126953125, 0.2701263427734375, 0.29437255859375, 0.3186187744140625, 0.342864990234375, 0.3671112060546875, 0.391357421875, 0.4156036376953125, 0.439849853515625, 0.4640960693359375, 0.48834228515625, 0.5125885009765625, 0.536834716796875, 0.5610809326171875, 0.5853271484375, 0.6095733642578125, 0.633819580078125, 0.6580657958984375, 0.68231201171875, 0.7065582275390625, 0.730804443359375, 0.7550506591796875, 0.779296875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 8.0, 5.0, 2.0, 18.0, 23.0, 28.0, 44.0, 57.0, 125.0, 299.0, 693.0, 2051.0, 7706.0, 46313.0, 2200385.0, 1882987.0, 42966.0, 7302.0, 1976.0, 645.0, 290.0, 141.0, 74.0, 42.0, 28.0, 29.0, 15.0, 8.0, 7.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.984375, -2.899078369140625, -2.81378173828125, -2.728485107421875, -2.6431884765625, -2.557891845703125, -2.47259521484375, -2.387298583984375, -2.302001953125, -2.216705322265625, -2.13140869140625, -2.046112060546875, -1.9608154296875, -1.875518798828125, -1.79022216796875, -1.704925537109375, -1.61962890625, -1.534332275390625, -1.44903564453125, -1.363739013671875, -1.2784423828125, -1.193145751953125, -1.10784912109375, -1.022552490234375, -0.937255859375, -0.851959228515625, -0.76666259765625, -0.681365966796875, -0.5960693359375, -0.510772705078125, -0.42547607421875, -0.340179443359375, -0.2548828125, -0.169586181640625, -0.08428955078125, 0.001007080078125, 0.0863037109375, 0.171600341796875, 0.25689697265625, 0.342193603515625, 0.427490234375, 0.512786865234375, 0.59808349609375, 0.683380126953125, 0.7686767578125, 0.853973388671875, 0.93927001953125, 1.024566650390625, 1.10986328125, 1.195159912109375, 1.28045654296875, 1.365753173828125, 1.4510498046875, 1.536346435546875, 1.62164306640625, 1.706939697265625, 1.792236328125, 1.877532958984375, 1.96282958984375, 2.048126220703125, 2.1334228515625, 2.218719482421875, 2.30401611328125, 2.389312744140625, 2.474609375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 1.0, 1.0, 5.0, 7.0, 3.0, 10.0, 26.0, 17.0, 23.0, 47.0, 68.0, 103.0, 212.0, 469.0, 979.0, 1059.0, 517.0, 218.0, 119.0, 63.0, 45.0, 23.0, 22.0, 8.0, 11.0, 4.0, 6.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9892578125, -1.9129791259765625, -1.836700439453125, -1.7604217529296875, -1.68414306640625, -1.6078643798828125, -1.531585693359375, -1.4553070068359375, -1.3790283203125, -1.3027496337890625, -1.226470947265625, -1.1501922607421875, -1.07391357421875, -0.9976348876953125, -0.921356201171875, -0.8450775146484375, -0.768798828125, -0.6925201416015625, -0.616241455078125, -0.5399627685546875, -0.46368408203125, -0.3874053955078125, -0.311126708984375, -0.2348480224609375, -0.1585693359375, -0.0822906494140625, -0.006011962890625, 0.0702667236328125, 0.14654541015625, 0.2228240966796875, 0.299102783203125, 0.3753814697265625, 0.45166015625, 0.5279388427734375, 0.604217529296875, 0.6804962158203125, 0.75677490234375, 0.8330535888671875, 0.909332275390625, 0.9856109619140625, 1.0618896484375, 1.1381683349609375, 1.214447021484375, 1.2907257080078125, 1.36700439453125, 1.4432830810546875, 1.519561767578125, 1.5958404541015625, 1.672119140625, 1.7483978271484375, 1.824676513671875, 1.9009552001953125, 1.97723388671875, 2.0535125732421875, 2.129791259765625, 2.2060699462890625, 2.2823486328125, 2.3586273193359375, 2.434906005859375, 2.5111846923828125, 2.58746337890625, 2.6637420654296875, 2.740020751953125, 2.8162994384765625, 2.892578125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 2.0, 1.0, 5.0, 15.0, 22.0, 47.0, 85.0, 167.0, 257.0, 192.0, 93.0, 62.0, 24.0, 13.0, 6.0, 2.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.713455200195312, -20.100908279418945, -19.48836326599121, -18.875816345214844, -18.26327133178711, -17.650724411010742, -17.038177490234375, -16.42563247680664, -15.813085556030273, -15.200539588928223, -14.587993621826172, -13.975446701049805, -13.362900733947754, -12.750354766845703, -12.137808799743652, -11.525262832641602, -10.91271686553955, -10.3001708984375, -9.68762493133545, -9.075078964233398, -8.462532043457031, -7.8499860763549805, -7.23744010925293, -6.624893665313721, -6.01234769821167, -5.399801731109619, -4.78725528717041, -4.174709320068359, -3.5621631145477295, -2.9496169090270996, -2.337070941925049, -1.7245244979858398, -1.111978530883789, -0.49943238496780396, 0.11311376094818115, 0.7256598472595215, 1.3382060527801514, 1.9507522583007812, 2.563298225402832, 3.175844669342041, 3.788390636444092, 4.400936603546143, 5.013483047485352, 5.626029014587402, 6.238574981689453, 6.851121425628662, 7.463667392730713, 8.076213836669922, 8.688759803771973, 9.301305770874023, 9.913851737976074, 10.526397705078125, 11.138944625854492, 11.751490592956543, 12.364036560058594, 12.976583480834961, 13.589128494262695, 14.201674461364746, 14.814220428466797, 15.426767349243164, 16.0393123626709, 16.651859283447266, 17.264404296875, 17.876951217651367, 18.489498138427734]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 3.0, 4.0, 13.0, 17.0, 14.0, 13.0, 18.0, 19.0, 24.0, 32.0, 26.0, 45.0, 44.0, 42.0, 49.0, 52.0, 45.0, 57.0, 42.0, 66.0, 35.0, 44.0, 46.0, 31.0, 43.0, 29.0, 31.0, 24.0, 14.0, 16.0, 11.0, 14.0, 9.0, 9.0, 5.0, 5.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.31397819519043, -9.049446105957031, -8.784913063049316, -8.520380973815918, -8.255847930908203, -7.991315841674805, -7.726783275604248, -7.462250709533691, -7.197718143463135, -6.933185577392578, -6.6686530113220215, -6.404120445251465, -6.139588356018066, -5.875055313110352, -5.610523223876953, -5.3459906578063965, -5.08145809173584, -4.816925525665283, -4.552392959594727, -4.28786039352417, -4.023327827453613, -3.7587954998016357, -3.494263172149658, -3.2297306060791016, -2.965198040008545, -2.7006654739379883, -2.4361329078674316, -2.171600580215454, -1.9070680141448975, -1.6425354480743408, -1.3780030012130737, -1.1134705543518066, -0.8489370346069336, -0.5844045281410217, -0.31987202167510986, -0.055339515209198, 0.20919299125671387, 0.4737255573272705, 0.7382580041885376, 1.0027904510498047, 1.2673230171203613, 1.531855583190918, 1.796388030052185, 2.060920476913452, 2.325453042984009, 2.5899856090545654, 2.854517936706543, 3.1190505027770996, 3.3835830688476562, 3.648115634918213, 3.9126482009887695, 4.177180767059326, 4.441713333129883, 4.706245422363281, 4.970777988433838, 5.2353105545043945, 5.499843120574951, 5.764375686645508, 6.0289082527160645, 6.293440818786621, 6.5579729080200195, 6.822505950927734, 7.087038040161133, 7.3515706062316895, 7.616103172302246]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 3.0, 6.0, 10.0, 9.0, 18.0, 23.0, 37.0, 54.0, 76.0, 114.0, 175.0, 206.0, 333.0, 520.0, 805.0, 1312.0, 2234.0, 3750.0, 6773.0, 12748.0, 25508.0, 54246.0, 122987.0, 276508.0, 291662.0, 132540.0, 57889.0, 27259.0, 13629.0, 7072.0, 3866.0, 2334.0, 1352.0, 850.0, 534.0, 375.0, 231.0, 168.0, 107.0, 77.0, 41.0, 36.0, 23.0, 22.0, 10.0, 5.0, 7.0, 2.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.171875, -1.134124755859375, -1.09637451171875, -1.058624267578125, -1.0208740234375, -0.983123779296875, -0.94537353515625, -0.907623291015625, -0.869873046875, -0.832122802734375, -0.79437255859375, -0.756622314453125, -0.7188720703125, -0.681121826171875, -0.64337158203125, -0.605621337890625, -0.56787109375, -0.530120849609375, -0.49237060546875, -0.454620361328125, -0.4168701171875, -0.379119873046875, -0.34136962890625, -0.303619384765625, -0.265869140625, -0.228118896484375, -0.19036865234375, -0.152618408203125, -0.1148681640625, -0.077117919921875, -0.03936767578125, -0.001617431640625, 0.0361328125, 0.073883056640625, 0.11163330078125, 0.149383544921875, 0.1871337890625, 0.224884033203125, 0.26263427734375, 0.300384521484375, 0.338134765625, 0.375885009765625, 0.41363525390625, 0.451385498046875, 0.4891357421875, 0.526885986328125, 0.56463623046875, 0.602386474609375, 0.64013671875, 0.677886962890625, 0.71563720703125, 0.753387451171875, 0.7911376953125, 0.828887939453125, 0.86663818359375, 0.904388427734375, 0.942138671875, 0.979888916015625, 1.01763916015625, 1.055389404296875, 1.0931396484375, 1.130889892578125, 1.16864013671875, 1.206390380859375, 1.244140625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 6.0, 2.0, 3.0, 7.0, 15.0, 10.0, 15.0, 13.0, 11.0, 15.0, 15.0, 32.0, 32.0, 21.0, 29.0, 36.0, 29.0, 40.0, 35.0, 35.0, 38.0, 51.0, 42.0, 37.0, 34.0, 48.0, 37.0, 43.0, 35.0, 30.0, 27.0, 15.0, 26.0, 22.0, 24.0, 23.0, 15.0, 11.0, 11.0, 6.0, 7.0, 5.0, 1.0, 7.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.71044921875, -0.68707275390625, -0.6636962890625, -0.64031982421875, -0.616943359375, -0.59356689453125, -0.5701904296875, -0.54681396484375, -0.5234375, -0.50006103515625, -0.4766845703125, -0.45330810546875, -0.429931640625, -0.40655517578125, -0.3831787109375, -0.35980224609375, -0.33642578125, -0.31304931640625, -0.2896728515625, -0.26629638671875, -0.242919921875, -0.21954345703125, -0.1961669921875, -0.17279052734375, -0.1494140625, -0.12603759765625, -0.1026611328125, -0.07928466796875, -0.055908203125, -0.03253173828125, -0.0091552734375, 0.01422119140625, 0.03759765625, 0.06097412109375, 0.0843505859375, 0.10772705078125, 0.131103515625, 0.15447998046875, 0.1778564453125, 0.20123291015625, 0.224609375, 0.24798583984375, 0.2713623046875, 0.29473876953125, 0.318115234375, 0.34149169921875, 0.3648681640625, 0.38824462890625, 0.41162109375, 0.43499755859375, 0.4583740234375, 0.48175048828125, 0.505126953125, 0.52850341796875, 0.5518798828125, 0.57525634765625, 0.5986328125, 0.62200927734375, 0.6453857421875, 0.66876220703125, 0.692138671875, 0.71551513671875, 0.7388916015625, 0.76226806640625, 0.78564453125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 8.0, 7.0, 9.0, 10.0, 17.0, 33.0, 38.0, 40.0, 75.0, 127.0, 146.0, 224.0, 432.0, 711.0, 1320.0, 2794.0, 7078.0, 24227.0, 114454.0, 689434.0, 160329.0, 31500.0, 8855.0, 3260.0, 1444.0, 759.0, 432.0, 266.0, 160.0, 117.0, 76.0, 40.0, 35.0, 25.0, 19.0, 19.0, 7.0, 6.0, 5.0, 6.0, 7.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-2.326171875, -2.2589263916015625, -2.191680908203125, -2.1244354248046875, -2.05718994140625, -1.9899444580078125, -1.922698974609375, -1.8554534912109375, -1.7882080078125, -1.7209625244140625, -1.653717041015625, -1.5864715576171875, -1.51922607421875, -1.4519805908203125, -1.384735107421875, -1.3174896240234375, -1.250244140625, -1.1829986572265625, -1.115753173828125, -1.0485076904296875, -0.98126220703125, -0.9140167236328125, -0.846771240234375, -0.7795257568359375, -0.7122802734375, -0.6450347900390625, -0.577789306640625, -0.5105438232421875, -0.44329833984375, -0.3760528564453125, -0.308807373046875, -0.2415618896484375, -0.17431640625, -0.1070709228515625, -0.039825439453125, 0.0274200439453125, 0.09466552734375, 0.1619110107421875, 0.229156494140625, 0.2964019775390625, 0.3636474609375, 0.4308929443359375, 0.498138427734375, 0.5653839111328125, 0.63262939453125, 0.6998748779296875, 0.767120361328125, 0.8343658447265625, 0.901611328125, 0.9688568115234375, 1.036102294921875, 1.1033477783203125, 1.17059326171875, 1.2378387451171875, 1.305084228515625, 1.3723297119140625, 1.4395751953125, 1.5068206787109375, 1.574066162109375, 1.6413116455078125, 1.70855712890625, 1.7758026123046875, 1.843048095703125, 1.9102935791015625, 1.9775390625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 7.0, 3.0, 6.0, 9.0, 12.0, 9.0, 24.0, 30.0, 29.0, 41.0, 50.0, 53.0, 53.0, 59.0, 62.0, 66.0, 62.0, 53.0, 52.0, 48.0, 56.0, 46.0, 30.0, 30.0, 32.0, 19.0, 13.0, 15.0, 7.0, 1.0, 6.0, 6.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.2265625, -4.115997314453125, -4.00543212890625, -3.894866943359375, -3.7843017578125, -3.673736572265625, -3.56317138671875, -3.452606201171875, -3.342041015625, -3.231475830078125, -3.12091064453125, -3.010345458984375, -2.8997802734375, -2.789215087890625, -2.67864990234375, -2.568084716796875, -2.45751953125, -2.346954345703125, -2.23638916015625, -2.125823974609375, -2.0152587890625, -1.904693603515625, -1.79412841796875, -1.683563232421875, -1.572998046875, -1.462432861328125, -1.35186767578125, -1.241302490234375, -1.1307373046875, -1.020172119140625, -0.90960693359375, -0.799041748046875, -0.6884765625, -0.577911376953125, -0.46734619140625, -0.356781005859375, -0.2462158203125, -0.135650634765625, -0.02508544921875, 0.085479736328125, 0.196044921875, 0.306610107421875, 0.41717529296875, 0.527740478515625, 0.6383056640625, 0.748870849609375, 0.85943603515625, 0.970001220703125, 1.08056640625, 1.191131591796875, 1.30169677734375, 1.412261962890625, 1.5228271484375, 1.633392333984375, 1.74395751953125, 1.854522705078125, 1.965087890625, 2.075653076171875, 2.18621826171875, 2.296783447265625, 2.4073486328125, 2.517913818359375, 2.62847900390625, 2.739044189453125, 2.849609375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 5.0, 6.0, 9.0, 11.0, 10.0, 16.0, 26.0, 46.0, 65.0, 108.0, 181.0, 341.0, 703.0, 1593.0, 4422.0, 15898.0, 81536.0, 753646.0, 153973.0, 25429.0, 6518.0, 2120.0, 904.0, 420.0, 204.0, 120.0, 70.0, 63.0, 48.0, 23.0, 13.0, 9.0, 9.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7001953125, -0.6773529052734375, -0.654510498046875, -0.6316680908203125, -0.60882568359375, -0.5859832763671875, -0.563140869140625, -0.5402984619140625, -0.5174560546875, -0.4946136474609375, -0.471771240234375, -0.4489288330078125, -0.42608642578125, -0.4032440185546875, -0.380401611328125, -0.3575592041015625, -0.334716796875, -0.3118743896484375, -0.289031982421875, -0.2661895751953125, -0.24334716796875, -0.2205047607421875, -0.197662353515625, -0.1748199462890625, -0.1519775390625, -0.1291351318359375, -0.106292724609375, -0.0834503173828125, -0.06060791015625, -0.0377655029296875, -0.014923095703125, 0.0079193115234375, 0.03076171875, 0.0536041259765625, 0.076446533203125, 0.0992889404296875, 0.12213134765625, 0.1449737548828125, 0.167816162109375, 0.1906585693359375, 0.2135009765625, 0.2363433837890625, 0.259185791015625, 0.2820281982421875, 0.30487060546875, 0.3277130126953125, 0.350555419921875, 0.3733978271484375, 0.396240234375, 0.4190826416015625, 0.441925048828125, 0.4647674560546875, 0.48760986328125, 0.5104522705078125, 0.533294677734375, 0.5561370849609375, 0.5789794921875, 0.6018218994140625, 0.624664306640625, 0.6475067138671875, 0.67034912109375, 0.6931915283203125, 0.716033935546875, 0.7388763427734375, 0.76171875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 8.0, 7.0, 9.0, 2.0, 8.0, 16.0, 12.0, 17.0, 22.0, 31.0, 35.0, 61.0, 40.0, 66.0, 95.0, 123.0, 111.0, 65.0, 58.0, 44.0, 39.0, 24.0, 21.0, 20.0, 12.0, 12.0, 8.0, 3.0, 9.0, 4.0, 7.0, 8.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014162063598632812, -0.000136692076921463, -0.0001317635178565979, -0.0001268349587917328, -0.00012190639972686768, -0.00011697784066200256, -0.00011204928159713745, -0.00010712072253227234, -0.00010219216346740723, -9.726360440254211e-05, -9.2335045337677e-05, -8.740648627281189e-05, -8.247792720794678e-05, -7.754936814308167e-05, -7.262080907821655e-05, -6.769225001335144e-05, -6.276369094848633e-05, -5.7835131883621216e-05, -5.2906572818756104e-05, -4.797801375389099e-05, -4.304945468902588e-05, -3.8120895624160767e-05, -3.3192336559295654e-05, -2.8263777494430542e-05, -2.333521842956543e-05, -1.8406659364700317e-05, -1.3478100299835205e-05, -8.549541234970093e-06, -3.6209821701049805e-06, 1.3075768947601318e-06, 6.236135959625244e-06, 1.1164695024490356e-05, 1.609325408935547e-05, 2.102181315422058e-05, 2.5950372219085693e-05, 3.0878931283950806e-05, 3.580749034881592e-05, 4.073604941368103e-05, 4.566460847854614e-05, 5.0593167543411255e-05, 5.552172660827637e-05, 6.045028567314148e-05, 6.537884473800659e-05, 7.03074038028717e-05, 7.523596286773682e-05, 8.016452193260193e-05, 8.509308099746704e-05, 9.002164006233215e-05, 9.495019912719727e-05, 9.987875819206238e-05, 0.00010480731725692749, 0.0001097358763217926, 0.00011466443538665771, 0.00011959299445152283, 0.00012452155351638794, 0.00012945011258125305, 0.00013437867164611816, 0.00013930723071098328, 0.0001442357897758484, 0.0001491643488407135, 0.0001540929079055786, 0.00015902146697044373, 0.00016395002603530884, 0.00016887858510017395, 0.00017380714416503906]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 0.0, 1.0, 1.0, 8.0, 4.0, 1.0, 7.0, 5.0, 10.0, 18.0, 20.0, 43.0, 56.0, 123.0, 257.0, 411.0, 868.0, 2144.0, 6215.0, 26524.0, 232395.0, 715770.0, 49013.0, 9515.0, 2799.0, 1137.0, 541.0, 279.0, 153.0, 84.0, 48.0, 30.0, 25.0, 20.0, 6.0, 3.0, 5.0, 3.0, 6.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.791015625, -0.7664260864257812, -0.7418365478515625, -0.7172470092773438, -0.692657470703125, -0.6680679321289062, -0.6434783935546875, -0.6188888549804688, -0.59429931640625, -0.5697097778320312, -0.5451202392578125, -0.5205307006835938, -0.495941162109375, -0.47135162353515625, -0.4467620849609375, -0.42217254638671875, -0.3975830078125, -0.37299346923828125, -0.3484039306640625, -0.32381439208984375, -0.299224853515625, -0.27463531494140625, -0.2500457763671875, -0.22545623779296875, -0.20086669921875, -0.17627716064453125, -0.1516876220703125, -0.12709808349609375, -0.102508544921875, -0.07791900634765625, -0.0533294677734375, -0.02873992919921875, -0.004150390625, 0.02043914794921875, 0.0450286865234375, 0.06961822509765625, 0.094207763671875, 0.11879730224609375, 0.1433868408203125, 0.16797637939453125, 0.19256591796875, 0.21715545654296875, 0.2417449951171875, 0.26633453369140625, 0.290924072265625, 0.31551361083984375, 0.3401031494140625, 0.36469268798828125, 0.3892822265625, 0.41387176513671875, 0.4384613037109375, 0.46305084228515625, 0.487640380859375, 0.5122299194335938, 0.5368194580078125, 0.5614089965820312, 0.58599853515625, 0.6105880737304688, 0.6351776123046875, 0.6597671508789062, 0.684356689453125, 0.7089462280273438, 0.7335357666015625, 0.7581253051757812, 0.78271484375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 5.0, 8.0, 15.0, 13.0, 37.0, 57.0, 85.0, 140.0, 180.0, 148.0, 105.0, 71.0, 41.0, 35.0, 22.0, 19.0, 6.0, 3.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1689453125, -1.1321258544921875, -1.095306396484375, -1.0584869384765625, -1.02166748046875, -0.9848480224609375, -0.948028564453125, -0.9112091064453125, -0.8743896484375, -0.8375701904296875, -0.800750732421875, -0.7639312744140625, -0.72711181640625, -0.6902923583984375, -0.653472900390625, -0.6166534423828125, -0.579833984375, -0.5430145263671875, -0.506195068359375, -0.4693756103515625, -0.43255615234375, -0.3957366943359375, -0.358917236328125, -0.3220977783203125, -0.2852783203125, -0.2484588623046875, -0.211639404296875, -0.1748199462890625, -0.13800048828125, -0.1011810302734375, -0.064361572265625, -0.0275421142578125, 0.00927734375, 0.0460968017578125, 0.082916259765625, 0.1197357177734375, 0.15655517578125, 0.1933746337890625, 0.230194091796875, 0.2670135498046875, 0.3038330078125, 0.3406524658203125, 0.377471923828125, 0.4142913818359375, 0.45111083984375, 0.4879302978515625, 0.524749755859375, 0.5615692138671875, 0.598388671875, 0.6352081298828125, 0.672027587890625, 0.7088470458984375, 0.74566650390625, 0.7824859619140625, 0.819305419921875, 0.8561248779296875, 0.8929443359375, 0.9297637939453125, 0.966583251953125, 1.0034027099609375, 1.04022216796875, 1.0770416259765625, 1.113861083984375, 1.1506805419921875, 1.1875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 3.0, 16.0, 21.0, 30.0, 55.0, 87.0, 148.0, 264.0, 126.0, 83.0, 54.0, 28.0, 22.0, 21.0, 11.0, 6.0, 6.0, 2.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-16.689308166503906, -16.253013610839844, -15.816718101501465, -15.380422592163086, -14.944127082824707, -14.507831573486328, -14.071537017822266, -13.635241508483887, -13.198945999145508, -12.762650489807129, -12.326355934143066, -11.890060424804688, -11.453764915466309, -11.01746940612793, -10.581174850463867, -10.144879341125488, -9.70858383178711, -9.27228832244873, -8.835993766784668, -8.399698257446289, -7.96340274810791, -7.5271077156066895, -7.090812683105469, -6.65451717376709, -6.218222618103027, -5.781927585601807, -5.345632076263428, -4.909337043762207, -4.473041534423828, -4.036746501922607, -3.6004512310028076, -3.164155960083008, -2.727860450744629, -2.291565179824829, -1.8552699089050293, -1.418974757194519, -0.9826794862747192, -0.546384334564209, -0.11008906364440918, 0.3262062072753906, 0.7625014781951904, 1.1987967491149902, 1.63509202003479, 2.07138729095459, 2.5076823234558105, 2.9439775943756104, 3.38027286529541, 3.81656813621521, 4.25286340713501, 4.6891584396362305, 5.125453948974609, 5.56174898147583, 5.998044490814209, 6.43433952331543, 6.870635032653809, 7.306930065155029, 7.74322509765625, 8.179520606994629, 8.615815162658691, 9.05211067199707, 9.48840618133545, 9.924701690673828, 10.36099624633789, 10.79729175567627, 11.233587265014648]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 3.0, 6.0, 5.0, 8.0, 6.0, 10.0, 10.0, 11.0, 15.0, 31.0, 15.0, 28.0, 23.0, 23.0, 36.0, 42.0, 45.0, 54.0, 60.0, 116.0, 93.0, 49.0, 44.0, 39.0, 30.0, 27.0, 28.0, 31.0, 22.0, 13.0, 8.0, 12.0, 14.0, 14.0, 8.0, 11.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0], "bins": [-13.936079025268555, -13.544151306152344, -13.152223587036133, -12.760295867919922, -12.368367195129395, -11.976439476013184, -11.584511756896973, -11.192584037780762, -10.800655364990234, -10.408727645874023, -10.016799926757812, -9.624872207641602, -9.232943534851074, -8.841015815734863, -8.449088096618652, -8.057160377502441, -7.6652326583862305, -7.2733049392700195, -6.88137674331665, -6.4894490242004395, -6.09752082824707, -5.705593109130859, -5.313665390014648, -4.9217376708984375, -4.529809474945068, -4.137881755828857, -3.7459535598754883, -3.3540258407592773, -2.9620978832244873, -2.5701699256896973, -2.1782422065734863, -1.7863142490386963, -1.3943853378295898, -1.0024573802947998, -0.6105295419692993, -0.21860170364379883, 0.1733262538909912, 0.5652542114257812, 0.9571819305419922, 1.3491098880767822, 1.7410378456115723, 2.1329658031463623, 2.5248937606811523, 2.9168214797973633, 3.3087494373321533, 3.7006773948669434, 4.092605113983154, 4.484533309936523, 4.876461029052734, 5.268388748168945, 5.6603169441223145, 6.052244663238525, 6.4441728591918945, 6.8361005783081055, 7.228028297424316, 7.619956016540527, 8.011884689331055, 8.403812408447266, 8.795740127563477, 9.187667846679688, 9.579596519470215, 9.971524238586426, 10.363451957702637, 10.755379676818848, 11.147307395935059]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 6.0, 8.0, 18.0, 14.0, 27.0, 27.0, 52.0, 73.0, 123.0, 190.0, 335.0, 597.0, 1075.0, 2230.0, 5053.0, 14265.0, 58412.0, 451304.0, 2717467.0, 816972.0, 94100.0, 19588.0, 6541.0, 2811.0, 1307.0, 659.0, 368.0, 227.0, 137.0, 82.0, 56.0, 57.0, 34.0, 20.0, 17.0, 8.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.111328125, -1.073822021484375, -1.03631591796875, -0.998809814453125, -0.9613037109375, -0.923797607421875, -0.88629150390625, -0.848785400390625, -0.811279296875, -0.773773193359375, -0.73626708984375, -0.698760986328125, -0.6612548828125, -0.623748779296875, -0.58624267578125, -0.548736572265625, -0.51123046875, -0.473724365234375, -0.43621826171875, -0.398712158203125, -0.3612060546875, -0.323699951171875, -0.28619384765625, -0.248687744140625, -0.211181640625, -0.173675537109375, -0.13616943359375, -0.098663330078125, -0.0611572265625, -0.023651123046875, 0.01385498046875, 0.051361083984375, 0.0888671875, 0.126373291015625, 0.16387939453125, 0.201385498046875, 0.2388916015625, 0.276397705078125, 0.31390380859375, 0.351409912109375, 0.388916015625, 0.426422119140625, 0.46392822265625, 0.501434326171875, 0.5389404296875, 0.576446533203125, 0.61395263671875, 0.651458740234375, 0.68896484375, 0.726470947265625, 0.76397705078125, 0.801483154296875, 0.8389892578125, 0.876495361328125, 0.91400146484375, 0.951507568359375, 0.989013671875, 1.026519775390625, 1.06402587890625, 1.101531982421875, 1.1390380859375, 1.176544189453125, 1.21405029296875, 1.251556396484375, 1.2890625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 3.0, 8.0, 14.0, 11.0, 14.0, 13.0, 17.0, 22.0, 17.0, 25.0, 33.0, 24.0, 34.0, 36.0, 45.0, 40.0, 28.0, 47.0, 52.0, 53.0, 40.0, 33.0, 37.0, 39.0, 39.0, 34.0, 39.0, 35.0, 24.0, 26.0, 23.0, 25.0, 17.0, 9.0, 7.0, 5.0, 7.0, 7.0, 3.0, 9.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0], "bins": [-0.814453125, -0.7899246215820312, -0.7653961181640625, -0.7408676147460938, -0.716339111328125, -0.6918106079101562, -0.6672821044921875, -0.6427536010742188, -0.61822509765625, -0.5936965942382812, -0.5691680908203125, -0.5446395874023438, -0.520111083984375, -0.49558258056640625, -0.4710540771484375, -0.44652557373046875, -0.4219970703125, -0.39746856689453125, -0.3729400634765625, -0.34841156005859375, -0.323883056640625, -0.29935455322265625, -0.2748260498046875, -0.25029754638671875, -0.22576904296875, -0.20124053955078125, -0.1767120361328125, -0.15218353271484375, -0.127655029296875, -0.10312652587890625, -0.0785980224609375, -0.05406951904296875, -0.029541015625, -0.00501251220703125, 0.0195159912109375, 0.04404449462890625, 0.068572998046875, 0.09310150146484375, 0.1176300048828125, 0.14215850830078125, 0.16668701171875, 0.19121551513671875, 0.2157440185546875, 0.24027252197265625, 0.264801025390625, 0.28932952880859375, 0.3138580322265625, 0.33838653564453125, 0.3629150390625, 0.38744354248046875, 0.4119720458984375, 0.43650054931640625, 0.461029052734375, 0.48555755615234375, 0.5100860595703125, 0.5346145629882812, 0.55914306640625, 0.5836715698242188, 0.6082000732421875, 0.6327285766601562, 0.657257080078125, 0.6817855834960938, 0.7063140869140625, 0.7308425903320312, 0.75537109375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 0.0, 4.0, 4.0, 3.0, 2.0, 12.0, 7.0, 12.0, 29.0, 34.0, 42.0, 79.0, 161.0, 294.0, 664.0, 2158.0, 7947.0, 48523.0, 2216296.0, 1861102.0, 45454.0, 7820.0, 2184.0, 734.0, 319.0, 137.0, 85.0, 46.0, 45.0, 25.0, 21.0, 17.0, 7.0, 6.0, 2.0, 1.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.484375, -2.4090576171875, -2.333740234375, -2.2584228515625, -2.18310546875, -2.1077880859375, -2.032470703125, -1.9571533203125, -1.8818359375, -1.8065185546875, -1.731201171875, -1.6558837890625, -1.58056640625, -1.5052490234375, -1.429931640625, -1.3546142578125, -1.279296875, -1.2039794921875, -1.128662109375, -1.0533447265625, -0.97802734375, -0.9027099609375, -0.827392578125, -0.7520751953125, -0.6767578125, -0.6014404296875, -0.526123046875, -0.4508056640625, -0.37548828125, -0.3001708984375, -0.224853515625, -0.1495361328125, -0.07421875, 0.0010986328125, 0.076416015625, 0.1517333984375, 0.22705078125, 0.3023681640625, 0.377685546875, 0.4530029296875, 0.5283203125, 0.6036376953125, 0.678955078125, 0.7542724609375, 0.82958984375, 0.9049072265625, 0.980224609375, 1.0555419921875, 1.130859375, 1.2061767578125, 1.281494140625, 1.3568115234375, 1.43212890625, 1.5074462890625, 1.582763671875, 1.6580810546875, 1.7333984375, 1.8087158203125, 1.884033203125, 1.9593505859375, 2.03466796875, 2.1099853515625, 2.185302734375, 2.2606201171875, 2.3359375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 6.0, 0.0, 3.0, 6.0, 6.0, 11.0, 18.0, 24.0, 39.0, 57.0, 96.0, 144.0, 281.0, 598.0, 1003.0, 839.0, 392.0, 218.0, 119.0, 74.0, 35.0, 22.0, 23.0, 21.0, 9.0, 7.0, 8.0, 7.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.544921875, -2.475738525390625, -2.40655517578125, -2.337371826171875, -2.2681884765625, -2.199005126953125, -2.12982177734375, -2.060638427734375, -1.991455078125, -1.922271728515625, -1.85308837890625, -1.783905029296875, -1.7147216796875, -1.645538330078125, -1.57635498046875, -1.507171630859375, -1.43798828125, -1.368804931640625, -1.29962158203125, -1.230438232421875, -1.1612548828125, -1.092071533203125, -1.02288818359375, -0.953704833984375, -0.884521484375, -0.815338134765625, -0.74615478515625, -0.676971435546875, -0.6077880859375, -0.538604736328125, -0.46942138671875, -0.400238037109375, -0.3310546875, -0.261871337890625, -0.19268798828125, -0.123504638671875, -0.0543212890625, 0.014862060546875, 0.08404541015625, 0.153228759765625, 0.222412109375, 0.291595458984375, 0.36077880859375, 0.429962158203125, 0.4991455078125, 0.568328857421875, 0.63751220703125, 0.706695556640625, 0.77587890625, 0.845062255859375, 0.91424560546875, 0.983428955078125, 1.0526123046875, 1.121795654296875, 1.19097900390625, 1.260162353515625, 1.329345703125, 1.398529052734375, 1.46771240234375, 1.536895751953125, 1.6060791015625, 1.675262451171875, 1.74444580078125, 1.813629150390625, 1.8828125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 43.0, 99.0, 284.0, 321.0, 158.0, 40.0, 21.0, 9.0, 11.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-36.12636947631836, -35.36076354980469, -34.59516143798828, -33.829559326171875, -33.0639533996582, -32.29834747314453, -31.532745361328125, -30.767141342163086, -30.001537322998047, -29.235933303833008, -28.47032928466797, -27.70472526550293, -26.93912124633789, -26.17351722717285, -25.407913208007812, -24.642309188842773, -23.876705169677734, -23.111101150512695, -22.345497131347656, -21.579893112182617, -20.814289093017578, -20.04868507385254, -19.2830810546875, -18.51747703552246, -17.751873016357422, -16.986268997192383, -16.220664978027344, -15.455060958862305, -14.689456939697266, -13.923852920532227, -13.158248901367188, -12.392644882202148, -11.62704086303711, -10.86143684387207, -10.095832824707031, -9.330228805541992, -8.564624786376953, -7.799020767211914, -7.033416748046875, -6.267812728881836, -5.502208709716797, -4.736604690551758, -3.9710006713867188, -3.2053966522216797, -2.4397926330566406, -1.6741886138916016, -0.9085845947265625, -0.14298057556152344, 0.6226234436035156, 1.3882274627685547, 2.1538314819335938, 2.919435501098633, 3.685039520263672, 4.450643539428711, 5.21624755859375, 5.981851577758789, 6.747455596923828, 7.513059616088867, 8.278663635253906, 9.044267654418945, 9.809871673583984, 10.575475692749023, 11.341079711914062, 12.106683731079102, 12.87228775024414]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 3.0, 4.0, 6.0, 6.0, 6.0, 9.0, 15.0, 11.0, 11.0, 16.0, 18.0, 24.0, 18.0, 28.0, 37.0, 39.0, 48.0, 31.0, 41.0, 48.0, 51.0, 51.0, 54.0, 45.0, 43.0, 38.0, 44.0, 31.0, 31.0, 34.0, 20.0, 15.0, 25.0, 22.0, 10.0, 7.0, 14.0, 10.0, 9.0, 7.0, 3.0, 3.0, 5.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0], "bins": [-6.457266807556152, -6.251025199890137, -6.044783592224121, -5.838541507720947, -5.632299900054932, -5.426058292388916, -5.219816207885742, -5.013574600219727, -4.807332992553711, -4.601091384887695, -4.39484977722168, -4.188607692718506, -3.9823660850524902, -3.7761244773864746, -3.56988263130188, -3.363640785217285, -3.1573991775512695, -2.951157569885254, -2.744915723800659, -2.5386738777160645, -2.332432270050049, -2.126190662384033, -1.9199488162994385, -1.7137070894241333, -1.5074653625488281, -1.301223635673523, -1.0949819087982178, -0.8887401819229126, -0.6824984550476074, -0.47625672817230225, -0.27001500129699707, -0.0637732744216919, 0.14246892929077148, 0.34871065616607666, 0.5549523830413818, 0.761194109916687, 0.9674358367919922, 1.1736775636672974, 1.3799192905426025, 1.5861610174179077, 1.792402744293213, 1.998644471168518, 2.2048861980438232, 2.411128044128418, 2.6173696517944336, 2.823611259460449, 3.029853105545044, 3.2360949516296387, 3.4423365592956543, 3.64857816696167, 3.8548200130462646, 4.061061859130859, 4.267303466796875, 4.473545074462891, 4.679786682128906, 4.88602876663208, 5.092270374298096, 5.298511981964111, 5.504754066467285, 5.710995674133301, 5.917237281799316, 6.123478889465332, 6.329720497131348, 6.5359625816345215, 6.742204189300537]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 7.0, 7.0, 13.0, 20.0, 26.0, 32.0, 61.0, 102.0, 111.0, 174.0, 250.0, 370.0, 531.0, 898.0, 1415.0, 2227.0, 3727.0, 6667.0, 12690.0, 27454.0, 67152.0, 187711.0, 420290.0, 190945.0, 68009.0, 28087.0, 12918.0, 6560.0, 3861.0, 2214.0, 1353.0, 848.0, 615.0, 367.0, 266.0, 198.0, 120.0, 82.0, 66.0, 32.0, 35.0, 14.0, 9.0, 8.0, 5.0, 3.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.59375, -1.5431671142578125, -1.492584228515625, -1.4420013427734375, -1.39141845703125, -1.3408355712890625, -1.290252685546875, -1.2396697998046875, -1.1890869140625, -1.1385040283203125, -1.087921142578125, -1.0373382568359375, -0.98675537109375, -0.9361724853515625, -0.885589599609375, -0.8350067138671875, -0.784423828125, -0.7338409423828125, -0.683258056640625, -0.6326751708984375, -0.58209228515625, -0.5315093994140625, -0.480926513671875, -0.4303436279296875, -0.3797607421875, -0.3291778564453125, -0.278594970703125, -0.2280120849609375, -0.17742919921875, -0.1268463134765625, -0.076263427734375, -0.0256805419921875, 0.02490234375, 0.0754852294921875, 0.126068115234375, 0.1766510009765625, 0.22723388671875, 0.2778167724609375, 0.328399658203125, 0.3789825439453125, 0.4295654296875, 0.4801483154296875, 0.530731201171875, 0.5813140869140625, 0.63189697265625, 0.6824798583984375, 0.733062744140625, 0.7836456298828125, 0.834228515625, 0.8848114013671875, 0.935394287109375, 0.9859771728515625, 1.03656005859375, 1.0871429443359375, 1.137725830078125, 1.1883087158203125, 1.2388916015625, 1.2894744873046875, 1.340057373046875, 1.3906402587890625, 1.44122314453125, 1.4918060302734375, 1.542388916015625, 1.5929718017578125, 1.6435546875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 2.0, 5.0, 6.0, 8.0, 5.0, 8.0, 15.0, 13.0, 20.0, 17.0, 25.0, 22.0, 34.0, 29.0, 33.0, 39.0, 30.0, 34.0, 55.0, 50.0, 39.0, 53.0, 45.0, 38.0, 37.0, 33.0, 40.0, 36.0, 35.0, 35.0, 27.0, 27.0, 22.0, 20.0, 21.0, 11.0, 7.0, 6.0, 7.0, 1.0, 8.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.7744140625, -0.7486953735351562, -0.7229766845703125, -0.6972579956054688, -0.671539306640625, -0.6458206176757812, -0.6201019287109375, -0.5943832397460938, -0.56866455078125, -0.5429458618164062, -0.5172271728515625, -0.49150848388671875, -0.465789794921875, -0.44007110595703125, -0.4143524169921875, -0.38863372802734375, -0.3629150390625, -0.33719635009765625, -0.3114776611328125, -0.28575897216796875, -0.260040283203125, -0.23432159423828125, -0.2086029052734375, -0.18288421630859375, -0.15716552734375, -0.13144683837890625, -0.1057281494140625, -0.08000946044921875, -0.054290771484375, -0.02857208251953125, -0.0028533935546875, 0.02286529541015625, 0.048583984375, 0.07430267333984375, 0.1000213623046875, 0.12574005126953125, 0.151458740234375, 0.17717742919921875, 0.2028961181640625, 0.22861480712890625, 0.25433349609375, 0.28005218505859375, 0.3057708740234375, 0.33148956298828125, 0.357208251953125, 0.38292694091796875, 0.4086456298828125, 0.43436431884765625, 0.4600830078125, 0.48580169677734375, 0.5115203857421875, 0.5372390747070312, 0.562957763671875, 0.5886764526367188, 0.6143951416015625, 0.6401138305664062, 0.66583251953125, 0.6915512084960938, 0.7172698974609375, 0.7429885864257812, 0.768707275390625, 0.7944259643554688, 0.8201446533203125, 0.8458633422851562, 0.87158203125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 1.0, 1.0, 1.0, 5.0, 11.0, 10.0, 11.0, 20.0, 20.0, 16.0, 22.0, 47.0, 54.0, 78.0, 110.0, 140.0, 189.0, 269.0, 370.0, 616.0, 1104.0, 2334.0, 5411.0, 17139.0, 78631.0, 747940.0, 152626.0, 26924.0, 7830.0, 2967.0, 1407.0, 767.0, 485.0, 282.0, 171.0, 140.0, 95.0, 76.0, 47.0, 44.0, 44.0, 25.0, 16.0, 15.0, 12.0, 7.0, 9.0, 5.0, 8.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-2.564453125, -2.490478515625, -2.41650390625, -2.342529296875, -2.2685546875, -2.194580078125, -2.12060546875, -2.046630859375, -1.97265625, -1.898681640625, -1.82470703125, -1.750732421875, -1.6767578125, -1.602783203125, -1.52880859375, -1.454833984375, -1.380859375, -1.306884765625, -1.23291015625, -1.158935546875, -1.0849609375, -1.010986328125, -0.93701171875, -0.863037109375, -0.7890625, -0.715087890625, -0.64111328125, -0.567138671875, -0.4931640625, -0.419189453125, -0.34521484375, -0.271240234375, -0.197265625, -0.123291015625, -0.04931640625, 0.024658203125, 0.0986328125, 0.172607421875, 0.24658203125, 0.320556640625, 0.39453125, 0.468505859375, 0.54248046875, 0.616455078125, 0.6904296875, 0.764404296875, 0.83837890625, 0.912353515625, 0.986328125, 1.060302734375, 1.13427734375, 1.208251953125, 1.2822265625, 1.356201171875, 1.43017578125, 1.504150390625, 1.578125, 1.652099609375, 1.72607421875, 1.800048828125, 1.8740234375, 1.947998046875, 2.02197265625, 2.095947265625, 2.169921875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 7.0, 10.0, 5.0, 8.0, 14.0, 10.0, 22.0, 24.0, 17.0, 22.0, 22.0, 32.0, 30.0, 32.0, 42.0, 40.0, 45.0, 63.0, 49.0, 63.0, 55.0, 46.0, 43.0, 38.0, 33.0, 25.0, 25.0, 20.0, 24.0, 23.0, 23.0, 10.0, 10.0, 12.0, 8.0, 18.0, 5.0, 8.0, 5.0, 1.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.078125, -2.9903564453125, -2.902587890625, -2.8148193359375, -2.72705078125, -2.6392822265625, -2.551513671875, -2.4637451171875, -2.3759765625, -2.2882080078125, -2.200439453125, -2.1126708984375, -2.02490234375, -1.9371337890625, -1.849365234375, -1.7615966796875, -1.673828125, -1.5860595703125, -1.498291015625, -1.4105224609375, -1.32275390625, -1.2349853515625, -1.147216796875, -1.0594482421875, -0.9716796875, -0.8839111328125, -0.796142578125, -0.7083740234375, -0.62060546875, -0.5328369140625, -0.445068359375, -0.3572998046875, -0.26953125, -0.1817626953125, -0.093994140625, -0.0062255859375, 0.08154296875, 0.1693115234375, 0.257080078125, 0.3448486328125, 0.4326171875, 0.5203857421875, 0.608154296875, 0.6959228515625, 0.78369140625, 0.8714599609375, 0.959228515625, 1.0469970703125, 1.134765625, 1.2225341796875, 1.310302734375, 1.3980712890625, 1.48583984375, 1.5736083984375, 1.661376953125, 1.7491455078125, 1.8369140625, 1.9246826171875, 2.012451171875, 2.1002197265625, 2.18798828125, 2.2757568359375, 2.363525390625, 2.4512939453125, 2.5390625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 5.0, 10.0, 7.0, 3.0, 7.0, 19.0, 20.0, 23.0, 29.0, 59.0, 95.0, 135.0, 238.0, 380.0, 730.0, 1425.0, 3273.0, 9755.0, 39766.0, 282590.0, 639683.0, 51249.0, 11790.0, 3851.0, 1565.0, 795.0, 376.0, 239.0, 149.0, 97.0, 47.0, 34.0, 30.0, 19.0, 18.0, 8.0, 7.0, 11.0, 5.0, 4.0, 4.0, 5.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61767578125, -0.598419189453125, -0.57916259765625, -0.559906005859375, -0.5406494140625, -0.521392822265625, -0.50213623046875, -0.482879638671875, -0.463623046875, -0.444366455078125, -0.42510986328125, -0.405853271484375, -0.3865966796875, -0.367340087890625, -0.34808349609375, -0.328826904296875, -0.3095703125, -0.290313720703125, -0.27105712890625, -0.251800537109375, -0.2325439453125, -0.213287353515625, -0.19403076171875, -0.174774169921875, -0.155517578125, -0.136260986328125, -0.11700439453125, -0.097747802734375, -0.0784912109375, -0.059234619140625, -0.03997802734375, -0.020721435546875, -0.00146484375, 0.017791748046875, 0.03704833984375, 0.056304931640625, 0.0755615234375, 0.094818115234375, 0.11407470703125, 0.133331298828125, 0.152587890625, 0.171844482421875, 0.19110107421875, 0.210357666015625, 0.2296142578125, 0.248870849609375, 0.26812744140625, 0.287384033203125, 0.306640625, 0.325897216796875, 0.34515380859375, 0.364410400390625, 0.3836669921875, 0.402923583984375, 0.42218017578125, 0.441436767578125, 0.460693359375, 0.479949951171875, 0.49920654296875, 0.518463134765625, 0.5377197265625, 0.556976318359375, 0.57623291015625, 0.595489501953125, 0.61474609375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 7.0, 7.0, 11.0, 14.0, 14.0, 28.0, 35.0, 61.0, 92.0, 124.0, 145.0, 149.0, 88.0, 62.0, 50.0, 34.0, 29.0, 11.0, 8.0, 12.0, 5.0, 2.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00028777122497558594, -0.00028052181005477905, -0.00027327239513397217, -0.0002660229802131653, -0.0002587735652923584, -0.0002515241503715515, -0.00024427473545074463, -0.00023702532052993774, -0.00022977590560913086, -0.00022252649068832397, -0.0002152770757675171, -0.0002080276608467102, -0.00020077824592590332, -0.00019352883100509644, -0.00018627941608428955, -0.00017903000116348267, -0.00017178058624267578, -0.0001645311713218689, -0.000157281756401062, -0.00015003234148025513, -0.00014278292655944824, -0.00013553351163864136, -0.00012828409671783447, -0.00012103468179702759, -0.0001137852668762207, -0.00010653585195541382, -9.928643703460693e-05, -9.203702211380005e-05, -8.478760719299316e-05, -7.753819227218628e-05, -7.02887773513794e-05, -6.303936243057251e-05, -5.5789947509765625e-05, -4.854053258895874e-05, -4.1291117668151855e-05, -3.404170274734497e-05, -2.6792287826538086e-05, -1.95428729057312e-05, -1.2293457984924316e-05, -5.044043064117432e-06, 2.205371856689453e-06, 9.454786777496338e-06, 1.6704201698303223e-05, 2.3953616619110107e-05, 3.120303153991699e-05, 3.845244646072388e-05, 4.570186138153076e-05, 5.2951276302337646e-05, 6.020069122314453e-05, 6.745010614395142e-05, 7.46995210647583e-05, 8.194893598556519e-05, 8.919835090637207e-05, 9.644776582717896e-05, 0.00010369718074798584, 0.00011094659566879272, 0.00011819601058959961, 0.0001254454255104065, 0.00013269484043121338, 0.00013994425535202026, 0.00014719367027282715, 0.00015444308519363403, 0.00016169250011444092, 0.0001689419150352478, 0.0001761913299560547]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 0.0, 5.0, 3.0, 7.0, 10.0, 8.0, 15.0, 8.0, 30.0, 35.0, 49.0, 62.0, 89.0, 128.0, 222.0, 364.0, 635.0, 1458.0, 3490.0, 10073.0, 43685.0, 429673.0, 497415.0, 44367.0, 10202.0, 3483.0, 1340.0, 649.0, 380.0, 216.0, 126.0, 96.0, 58.0, 49.0, 30.0, 23.0, 21.0, 11.0, 13.0, 13.0, 5.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.5947265625, -0.5767059326171875, -0.558685302734375, -0.5406646728515625, -0.52264404296875, -0.5046234130859375, -0.486602783203125, -0.4685821533203125, -0.4505615234375, -0.4325408935546875, -0.414520263671875, -0.3964996337890625, -0.37847900390625, -0.3604583740234375, -0.342437744140625, -0.3244171142578125, -0.306396484375, -0.2883758544921875, -0.270355224609375, -0.2523345947265625, -0.23431396484375, -0.2162933349609375, -0.198272705078125, -0.1802520751953125, -0.1622314453125, -0.1442108154296875, -0.126190185546875, -0.1081695556640625, -0.09014892578125, -0.0721282958984375, -0.054107666015625, -0.0360870361328125, -0.01806640625, -4.57763671875e-05, 0.017974853515625, 0.0359954833984375, 0.05401611328125, 0.0720367431640625, 0.090057373046875, 0.1080780029296875, 0.1260986328125, 0.1441192626953125, 0.162139892578125, 0.1801605224609375, 0.19818115234375, 0.2162017822265625, 0.234222412109375, 0.2522430419921875, 0.270263671875, 0.2882843017578125, 0.306304931640625, 0.3243255615234375, 0.34234619140625, 0.3603668212890625, 0.378387451171875, 0.3964080810546875, 0.4144287109375, 0.4324493408203125, 0.450469970703125, 0.4684906005859375, 0.48651123046875, 0.5045318603515625, 0.522552490234375, 0.5405731201171875, 0.55859375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 7.0, 5.0, 1.0, 8.0, 13.0, 12.0, 18.0, 15.0, 16.0, 26.0, 32.0, 37.0, 43.0, 55.0, 53.0, 59.0, 74.0, 60.0, 63.0, 67.0, 64.0, 38.0, 39.0, 33.0, 31.0, 18.0, 23.0, 14.0, 9.0, 12.0, 9.0, 14.0, 3.0, 4.0, 5.0, 0.0, 5.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.4462890625, -0.43256378173828125, -0.4188385009765625, -0.40511322021484375, -0.391387939453125, -0.37766265869140625, -0.3639373779296875, -0.35021209716796875, -0.33648681640625, -0.32276153564453125, -0.3090362548828125, -0.29531097412109375, -0.281585693359375, -0.26786041259765625, -0.2541351318359375, -0.24040985107421875, -0.2266845703125, -0.21295928955078125, -0.1992340087890625, -0.18550872802734375, -0.171783447265625, -0.15805816650390625, -0.1443328857421875, -0.13060760498046875, -0.11688232421875, -0.10315704345703125, -0.0894317626953125, -0.07570648193359375, -0.061981201171875, -0.04825592041015625, -0.0345306396484375, -0.02080535888671875, -0.007080078125, 0.00664520263671875, 0.0203704833984375, 0.03409576416015625, 0.047821044921875, 0.06154632568359375, 0.0752716064453125, 0.08899688720703125, 0.10272216796875, 0.11644744873046875, 0.1301727294921875, 0.14389801025390625, 0.157623291015625, 0.17134857177734375, 0.1850738525390625, 0.19879913330078125, 0.2125244140625, 0.22624969482421875, 0.2399749755859375, 0.25370025634765625, 0.267425537109375, 0.28115081787109375, 0.2948760986328125, 0.30860137939453125, 0.32232666015625, 0.33605194091796875, 0.3497772216796875, 0.36350250244140625, 0.377227783203125, 0.39095306396484375, 0.4046783447265625, 0.41840362548828125, 0.43212890625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 11.0, 11.0, 23.0, 49.0, 97.0, 331.0, 227.0, 112.0, 53.0, 39.0, 25.0, 12.0, 7.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.293344497680664, -12.657795906066895, -12.022247314453125, -11.386699676513672, -10.751151084899902, -10.115602493286133, -9.48005485534668, -8.84450626373291, -8.20895767211914, -7.573409080505371, -6.93786096572876, -6.302312850952148, -5.666764259338379, -5.031215667724609, -4.395667552947998, -3.7601194381713867, -3.124570846557617, -2.4890224933624268, -1.8534741401672363, -1.217925786972046, -0.5823774337768555, 0.05317091941833496, 0.6887192726135254, 1.3242673873901367, 1.9598159790039062, 2.5953643321990967, 3.230912685394287, 3.8664610385894775, 4.502009391784668, 5.1375579833984375, 5.773106098175049, 6.40865421295166, 7.0442047119140625, 7.679753303527832, 8.315301895141602, 8.950849533081055, 9.586398124694824, 10.221946716308594, 10.857494354248047, 11.493042945861816, 12.128591537475586, 12.764140129089355, 13.399688720703125, 14.035236358642578, 14.670784950256348, 15.306333541870117, 15.94188117980957, 16.577430725097656, 17.21297836303711, 17.848526000976562, 18.48407554626465, 19.1196231842041, 19.755172729492188, 20.39072036743164, 21.026268005371094, 21.661815643310547, 22.297365188598633, 22.932912826538086, 23.568462371826172, 24.204010009765625, 24.839557647705078, 25.475107192993164, 26.110654830932617, 26.746204376220703, 27.381752014160156]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 0.0, 2.0, 0.0, 4.0, 7.0, 8.0, 9.0, 7.0, 14.0, 13.0, 18.0, 12.0, 19.0, 19.0, 21.0, 20.0, 25.0, 30.0, 39.0, 35.0, 39.0, 68.0, 86.0, 128.0, 88.0, 42.0, 33.0, 28.0, 23.0, 14.0, 23.0, 17.0, 17.0, 19.0, 11.0, 9.0, 11.0, 9.0, 7.0, 5.0, 4.0, 2.0, 4.0, 5.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-9.808591842651367, -9.52204418182373, -9.235495567321777, -8.94894790649414, -8.662399291992188, -8.37585163116455, -8.089303970336914, -7.802755832672119, -7.516207695007324, -7.229659557342529, -6.943111419677734, -6.656563758850098, -6.370015621185303, -6.083467483520508, -5.796919822692871, -5.510371685028076, -5.223823547363281, -4.937275409698486, -4.650727272033691, -4.364179611206055, -4.07763147354126, -3.791083335876465, -3.504535436630249, -3.217987537384033, -2.9314393997192383, -2.6448912620544434, -2.3583433628082275, -2.0717954635620117, -1.7852473258972168, -1.4986993074417114, -1.212151288986206, -0.9256033897399902, -0.6390552520751953, -0.35250723361968994, -0.06595921516418457, 0.2205888032913208, 0.5071368217468262, 0.7936848402023315, 1.080232858657837, 1.3667807579040527, 1.6533288955688477, 1.939876914024353, 2.2264249324798584, 2.512972831726074, 2.799520969390869, 3.086069107055664, 3.37261700630188, 3.6591649055480957, 3.9457130432128906, 4.2322611808776855, 4.5188093185424805, 4.805356979370117, 5.091905117034912, 5.378453254699707, 5.665000915527344, 5.951549053192139, 6.238097190856934, 6.5246453285217285, 6.811193466186523, 7.09774112701416, 7.384289264678955, 7.67083740234375, 7.957385063171387, 8.243932723999023, 8.530481338500977]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 7.0, 8.0, 18.0, 31.0, 25.0, 51.0, 79.0, 107.0, 173.0, 266.0, 458.0, 827.0, 1513.0, 3283.0, 8334.0, 27599.0, 136975.0, 1365623.0, 2345134.0, 244145.0, 39880.0, 11158.0, 4269.0, 1904.0, 968.0, 558.0, 345.0, 178.0, 135.0, 69.0, 44.0, 38.0, 25.0, 18.0, 16.0, 11.0, 6.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.046875, -1.98114013671875, -1.9154052734375, -1.84967041015625, -1.783935546875, -1.71820068359375, -1.6524658203125, -1.58673095703125, -1.52099609375, -1.45526123046875, -1.3895263671875, -1.32379150390625, -1.258056640625, -1.19232177734375, -1.1265869140625, -1.06085205078125, -0.9951171875, -0.92938232421875, -0.8636474609375, -0.79791259765625, -0.732177734375, -0.66644287109375, -0.6007080078125, -0.53497314453125, -0.46923828125, -0.40350341796875, -0.3377685546875, -0.27203369140625, -0.206298828125, -0.14056396484375, -0.0748291015625, -0.00909423828125, 0.056640625, 0.12237548828125, 0.1881103515625, 0.25384521484375, 0.319580078125, 0.38531494140625, 0.4510498046875, 0.51678466796875, 0.58251953125, 0.64825439453125, 0.7139892578125, 0.77972412109375, 0.845458984375, 0.91119384765625, 0.9769287109375, 1.04266357421875, 1.1083984375, 1.17413330078125, 1.2398681640625, 1.30560302734375, 1.371337890625, 1.43707275390625, 1.5028076171875, 1.56854248046875, 1.63427734375, 1.70001220703125, 1.7657470703125, 1.83148193359375, 1.897216796875, 1.96295166015625, 2.0286865234375, 2.09442138671875, 2.16015625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 6.0, 5.0, 8.0, 15.0, 9.0, 15.0, 23.0, 26.0, 29.0, 22.0, 26.0, 51.0, 41.0, 38.0, 43.0, 32.0, 53.0, 65.0, 54.0, 52.0, 37.0, 42.0, 35.0, 30.0, 35.0, 34.0, 28.0, 25.0, 23.0, 24.0, 16.0, 15.0, 9.0, 6.0, 9.0, 4.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.767578125, -0.7418289184570312, -0.7160797119140625, -0.6903305053710938, -0.664581298828125, -0.6388320922851562, -0.6130828857421875, -0.5873336791992188, -0.56158447265625, -0.5358352661132812, -0.5100860595703125, -0.48433685302734375, -0.458587646484375, -0.43283843994140625, -0.4070892333984375, -0.38134002685546875, -0.3555908203125, -0.32984161376953125, -0.3040924072265625, -0.27834320068359375, -0.252593994140625, -0.22684478759765625, -0.2010955810546875, -0.17534637451171875, -0.14959716796875, -0.12384796142578125, -0.0980987548828125, -0.07234954833984375, -0.046600341796875, -0.02085113525390625, 0.0048980712890625, 0.03064727783203125, 0.056396484375, 0.08214569091796875, 0.1078948974609375, 0.13364410400390625, 0.159393310546875, 0.18514251708984375, 0.2108917236328125, 0.23664093017578125, 0.26239013671875, 0.28813934326171875, 0.3138885498046875, 0.33963775634765625, 0.365386962890625, 0.39113616943359375, 0.4168853759765625, 0.44263458251953125, 0.4683837890625, 0.49413299560546875, 0.5198822021484375, 0.5456314086914062, 0.571380615234375, 0.5971298217773438, 0.6228790283203125, 0.6486282348632812, 0.67437744140625, 0.7001266479492188, 0.7258758544921875, 0.7516250610351562, 0.777374267578125, 0.8031234741210938, 0.8288726806640625, 0.8546218872070312, 0.88037109375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 8.0, 2.0, 6.0, 7.0, 12.0, 15.0, 16.0, 26.0, 38.0, 64.0, 90.0, 153.0, 259.0, 462.0, 959.0, 2372.0, 7865.0, 66454.0, 3787899.0, 305348.0, 15811.0, 3670.0, 1310.0, 615.0, 307.0, 175.0, 108.0, 75.0, 55.0, 40.0, 20.0, 15.0, 7.0, 6.0, 4.0, 2.0, 1.0, 4.0, 4.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0], "bins": [-5.1640625, -5.027099609375, -4.89013671875, -4.753173828125, -4.6162109375, -4.479248046875, -4.34228515625, -4.205322265625, -4.068359375, -3.931396484375, -3.79443359375, -3.657470703125, -3.5205078125, -3.383544921875, -3.24658203125, -3.109619140625, -2.97265625, -2.835693359375, -2.69873046875, -2.561767578125, -2.4248046875, -2.287841796875, -2.15087890625, -2.013916015625, -1.876953125, -1.739990234375, -1.60302734375, -1.466064453125, -1.3291015625, -1.192138671875, -1.05517578125, -0.918212890625, -0.78125, -0.644287109375, -0.50732421875, -0.370361328125, -0.2333984375, -0.096435546875, 0.04052734375, 0.177490234375, 0.314453125, 0.451416015625, 0.58837890625, 0.725341796875, 0.8623046875, 0.999267578125, 1.13623046875, 1.273193359375, 1.41015625, 1.547119140625, 1.68408203125, 1.821044921875, 1.9580078125, 2.094970703125, 2.23193359375, 2.368896484375, 2.505859375, 2.642822265625, 2.77978515625, 2.916748046875, 3.0537109375, 3.190673828125, 3.32763671875, 3.464599609375, 3.6015625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 5.0, 6.0, 7.0, 8.0, 18.0, 27.0, 26.0, 40.0, 68.0, 77.0, 143.0, 228.0, 392.0, 591.0, 825.0, 588.0, 332.0, 226.0, 153.0, 87.0, 82.0, 51.0, 35.0, 22.0, 7.0, 10.0, 12.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.712890625, -2.610626220703125, -2.50836181640625, -2.406097412109375, -2.3038330078125, -2.201568603515625, -2.09930419921875, -1.997039794921875, -1.894775390625, -1.792510986328125, -1.69024658203125, -1.587982177734375, -1.4857177734375, -1.383453369140625, -1.28118896484375, -1.178924560546875, -1.07666015625, -0.974395751953125, -0.87213134765625, -0.769866943359375, -0.6676025390625, -0.565338134765625, -0.46307373046875, -0.360809326171875, -0.258544921875, -0.156280517578125, -0.05401611328125, 0.048248291015625, 0.1505126953125, 0.252777099609375, 0.35504150390625, 0.457305908203125, 0.5595703125, 0.661834716796875, 0.76409912109375, 0.866363525390625, 0.9686279296875, 1.070892333984375, 1.17315673828125, 1.275421142578125, 1.377685546875, 1.479949951171875, 1.58221435546875, 1.684478759765625, 1.7867431640625, 1.889007568359375, 1.99127197265625, 2.093536376953125, 2.19580078125, 2.298065185546875, 2.40032958984375, 2.502593994140625, 2.6048583984375, 2.707122802734375, 2.80938720703125, 2.911651611328125, 3.013916015625, 3.116180419921875, 3.21844482421875, 3.320709228515625, 3.4229736328125, 3.525238037109375, 3.62750244140625, 3.729766845703125, 3.83203125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 8.0, 11.0, 16.0, 27.0, 33.0, 83.0, 151.0, 212.0, 198.0, 116.0, 52.0, 38.0, 18.0, 13.0, 7.0, 5.0, 0.0, 3.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.202171325683594, -34.131813049316406, -33.06145477294922, -31.99109649658203, -30.920738220214844, -29.850379943847656, -28.78002166748047, -27.70966339111328, -26.639305114746094, -25.568946838378906, -24.49858856201172, -23.42823028564453, -22.357872009277344, -21.287513732910156, -20.21715545654297, -19.14679718017578, -18.076440811157227, -17.00608253479004, -15.935724258422852, -14.865365982055664, -13.795007705688477, -12.724649429321289, -11.654292106628418, -10.58393383026123, -9.513575553894043, -8.443217277526855, -7.372859001159668, -6.302501201629639, -5.232142925262451, -4.161784648895264, -3.0914268493652344, -2.021068572998047, -0.9507102966308594, 0.11964786052703857, 1.1900060176849365, 2.260364055633545, 3.3307223320007324, 4.40108060836792, 5.471438407897949, 6.541796684265137, 7.612154960632324, 8.682513236999512, 9.7528715133667, 10.82322883605957, 11.893587112426758, 12.963945388793945, 14.034303665161133, 15.10466194152832, 16.175020217895508, 17.245378494262695, 18.315736770629883, 19.38609504699707, 20.456453323364258, 21.526811599731445, 22.59716796875, 23.667526245117188, 24.737884521484375, 25.808242797851562, 26.87860107421875, 27.948959350585938, 29.019317626953125, 30.089675903320312, 31.1600341796875, 32.23039245605469, 33.300750732421875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 6.0, 4.0, 7.0, 9.0, 6.0, 13.0, 15.0, 15.0, 18.0, 24.0, 20.0, 33.0, 32.0, 45.0, 35.0, 42.0, 48.0, 57.0, 58.0, 61.0, 60.0, 53.0, 46.0, 40.0, 43.0, 31.0, 37.0, 17.0, 22.0, 16.0, 28.0, 7.0, 17.0, 9.0, 7.0, 6.0, 9.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.340259552001953, -14.857845306396484, -14.375432014465332, -13.893017768859863, -13.410604476928711, -12.928190231323242, -12.445775985717773, -11.963362693786621, -11.480949401855469, -10.99853515625, -10.516121864318848, -10.033707618713379, -9.551294326782227, -9.068880081176758, -8.586465835571289, -8.104052543640137, -7.621638298034668, -7.139224529266357, -6.656810760498047, -6.174396514892578, -5.691983222961426, -5.209568977355957, -4.7271552085876465, -4.244741439819336, -3.7623276710510254, -3.279913902282715, -2.7975001335144043, -2.3150861263275146, -1.832672357559204, -1.3502585887908936, -0.8678445816040039, -0.38543081283569336, 0.0969839096069336, 0.5793977379798889, 1.0618115663528442, 1.5442254543304443, 2.026639223098755, 2.5090529918670654, 2.991466999053955, 3.4738807678222656, 3.956294536590576, 4.438708305358887, 4.921122074127197, 5.403535842895508, 5.885950088500977, 6.368363380432129, 6.850777626037598, 7.333191394805908, 7.815605163574219, 8.298019409179688, 8.78043270111084, 9.262846946716309, 9.745260238647461, 10.22767448425293, 10.710088729858398, 11.19250202178955, 11.674915313720703, 12.157329559326172, 12.639742851257324, 13.122157096862793, 13.604570388793945, 14.086984634399414, 14.569398880004883, 15.051812171936035, 15.534226417541504]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 7.0, 11.0, 11.0, 21.0, 35.0, 41.0, 52.0, 73.0, 111.0, 177.0, 244.0, 429.0, 655.0, 1116.0, 1935.0, 3375.0, 5853.0, 11200.0, 22545.0, 52054.0, 150481.0, 535166.0, 159386.0, 54057.0, 23466.0, 11501.0, 6023.0, 3445.0, 2039.0, 1147.0, 647.0, 422.0, 284.0, 183.0, 107.0, 81.0, 49.0, 31.0, 29.0, 19.0, 11.0, 10.0, 9.0, 2.0, 6.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 3.0], "bins": [-1.35546875, -1.315032958984375, -1.27459716796875, -1.234161376953125, -1.1937255859375, -1.153289794921875, -1.11285400390625, -1.072418212890625, -1.031982421875, -0.991546630859375, -0.95111083984375, -0.910675048828125, -0.8702392578125, -0.829803466796875, -0.78936767578125, -0.748931884765625, -0.70849609375, -0.668060302734375, -0.62762451171875, -0.587188720703125, -0.5467529296875, -0.506317138671875, -0.46588134765625, -0.425445556640625, -0.385009765625, -0.344573974609375, -0.30413818359375, -0.263702392578125, -0.2232666015625, -0.182830810546875, -0.14239501953125, -0.101959228515625, -0.0615234375, -0.021087646484375, 0.01934814453125, 0.059783935546875, 0.1002197265625, 0.140655517578125, 0.18109130859375, 0.221527099609375, 0.261962890625, 0.302398681640625, 0.34283447265625, 0.383270263671875, 0.4237060546875, 0.464141845703125, 0.50457763671875, 0.545013427734375, 0.58544921875, 0.625885009765625, 0.66632080078125, 0.706756591796875, 0.7471923828125, 0.787628173828125, 0.82806396484375, 0.868499755859375, 0.908935546875, 0.949371337890625, 0.98980712890625, 1.030242919921875, 1.0706787109375, 1.111114501953125, 1.15155029296875, 1.191986083984375, 1.232421875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 5.0, 9.0, 9.0, 15.0, 14.0, 14.0, 22.0, 18.0, 25.0, 30.0, 39.0, 39.0, 40.0, 50.0, 74.0, 49.0, 54.0, 72.0, 61.0, 51.0, 34.0, 51.0, 33.0, 27.0, 37.0, 30.0, 29.0, 20.0, 11.0, 14.0, 12.0, 7.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.193359375, -1.157928466796875, -1.12249755859375, -1.087066650390625, -1.0516357421875, -1.016204833984375, -0.98077392578125, -0.945343017578125, -0.909912109375, -0.874481201171875, -0.83905029296875, -0.803619384765625, -0.7681884765625, -0.732757568359375, -0.69732666015625, -0.661895751953125, -0.62646484375, -0.591033935546875, -0.55560302734375, -0.520172119140625, -0.4847412109375, -0.449310302734375, -0.41387939453125, -0.378448486328125, -0.343017578125, -0.307586669921875, -0.27215576171875, -0.236724853515625, -0.2012939453125, -0.165863037109375, -0.13043212890625, -0.095001220703125, -0.0595703125, -0.024139404296875, 0.01129150390625, 0.046722412109375, 0.0821533203125, 0.117584228515625, 0.15301513671875, 0.188446044921875, 0.223876953125, 0.259307861328125, 0.29473876953125, 0.330169677734375, 0.3656005859375, 0.401031494140625, 0.43646240234375, 0.471893310546875, 0.50732421875, 0.542755126953125, 0.57818603515625, 0.613616943359375, 0.6490478515625, 0.684478759765625, 0.71990966796875, 0.755340576171875, 0.790771484375, 0.826202392578125, 0.86163330078125, 0.897064208984375, 0.9324951171875, 0.967926025390625, 1.00335693359375, 1.038787841796875, 1.07421875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 4.0, 10.0, 6.0, 7.0, 18.0, 30.0, 44.0, 57.0, 114.0, 189.0, 336.0, 765.0, 2146.0, 9174.0, 142000.0, 872407.0, 16223.0, 3057.0, 1038.0, 433.0, 203.0, 111.0, 53.0, 34.0, 31.0, 21.0, 18.0, 10.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 3.0], "bins": [-5.59765625, -5.464813232421875, -5.33197021484375, -5.199127197265625, -5.0662841796875, -4.933441162109375, -4.80059814453125, -4.667755126953125, -4.534912109375, -4.402069091796875, -4.26922607421875, -4.136383056640625, -4.0035400390625, -3.870697021484375, -3.73785400390625, -3.605010986328125, -3.47216796875, -3.339324951171875, -3.20648193359375, -3.073638916015625, -2.9407958984375, -2.807952880859375, -2.67510986328125, -2.542266845703125, -2.409423828125, -2.276580810546875, -2.14373779296875, -2.010894775390625, -1.8780517578125, -1.745208740234375, -1.61236572265625, -1.479522705078125, -1.3466796875, -1.213836669921875, -1.08099365234375, -0.948150634765625, -0.8153076171875, -0.682464599609375, -0.54962158203125, -0.416778564453125, -0.283935546875, -0.151092529296875, -0.01824951171875, 0.114593505859375, 0.2474365234375, 0.380279541015625, 0.51312255859375, 0.645965576171875, 0.77880859375, 0.911651611328125, 1.04449462890625, 1.177337646484375, 1.3101806640625, 1.443023681640625, 1.57586669921875, 1.708709716796875, 1.841552734375, 1.974395751953125, 2.10723876953125, 2.240081787109375, 2.3729248046875, 2.505767822265625, 2.63861083984375, 2.771453857421875, 2.904296875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 4.0, 7.0, 3.0, 5.0, 11.0, 24.0, 24.0, 16.0, 24.0, 27.0, 25.0, 39.0, 60.0, 56.0, 98.0, 118.0, 88.0, 67.0, 51.0, 48.0, 37.0, 31.0, 33.0, 16.0, 18.0, 11.0, 9.0, 11.0, 8.0, 6.0, 4.0, 6.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.73828125, -5.56707763671875, -5.3958740234375, -5.22467041015625, -5.053466796875, -4.88226318359375, -4.7110595703125, -4.53985595703125, -4.36865234375, -4.19744873046875, -4.0262451171875, -3.85504150390625, -3.683837890625, -3.51263427734375, -3.3414306640625, -3.17022705078125, -2.9990234375, -2.82781982421875, -2.6566162109375, -2.48541259765625, -2.314208984375, -2.14300537109375, -1.9718017578125, -1.80059814453125, -1.62939453125, -1.45819091796875, -1.2869873046875, -1.11578369140625, -0.944580078125, -0.77337646484375, -0.6021728515625, -0.43096923828125, -0.259765625, -0.08856201171875, 0.0826416015625, 0.25384521484375, 0.425048828125, 0.59625244140625, 0.7674560546875, 0.93865966796875, 1.10986328125, 1.28106689453125, 1.4522705078125, 1.62347412109375, 1.794677734375, 1.96588134765625, 2.1370849609375, 2.30828857421875, 2.4794921875, 2.65069580078125, 2.8218994140625, 2.99310302734375, 3.164306640625, 3.33551025390625, 3.5067138671875, 3.67791748046875, 3.84912109375, 4.02032470703125, 4.1915283203125, 4.36273193359375, 4.533935546875, 4.70513916015625, 4.8763427734375, 5.04754638671875, 5.21875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 7.0, 10.0, 6.0, 10.0, 12.0, 16.0, 21.0, 38.0, 80.0, 96.0, 149.0, 211.0, 334.0, 620.0, 1133.0, 2423.0, 6551.0, 23424.0, 168384.0, 792187.0, 37347.0, 9012.0, 3178.0, 1446.0, 706.0, 400.0, 233.0, 167.0, 121.0, 75.0, 49.0, 27.0, 21.0, 16.0, 5.0, 6.0, 5.0, 5.0, 6.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 2.0], "bins": [-0.56591796875, -0.5498161315917969, -0.5337142944335938, -0.5176124572753906, -0.5015106201171875, -0.4854087829589844, -0.46930694580078125, -0.4532051086425781, -0.437103271484375, -0.4210014343261719, -0.40489959716796875, -0.3887977600097656, -0.3726959228515625, -0.3565940856933594, -0.34049224853515625, -0.3243904113769531, -0.30828857421875, -0.2921867370605469, -0.27608489990234375, -0.2599830627441406, -0.2438812255859375, -0.22777938842773438, -0.21167755126953125, -0.19557571411132812, -0.179473876953125, -0.16337203979492188, -0.14727020263671875, -0.13116836547851562, -0.1150665283203125, -0.09896469116210938, -0.08286285400390625, -0.06676101684570312, -0.0506591796875, -0.034557342529296875, -0.01845550537109375, -0.002353668212890625, 0.0137481689453125, 0.029850006103515625, 0.04595184326171875, 0.062053680419921875, 0.078155517578125, 0.09425735473632812, 0.11035919189453125, 0.12646102905273438, 0.1425628662109375, 0.15866470336914062, 0.17476654052734375, 0.19086837768554688, 0.20697021484375, 0.22307205200195312, 0.23917388916015625, 0.2552757263183594, 0.2713775634765625, 0.2874794006347656, 0.30358123779296875, 0.3196830749511719, 0.335784912109375, 0.3518867492675781, 0.36798858642578125, 0.3840904235839844, 0.4001922607421875, 0.4162940979003906, 0.43239593505859375, 0.4484977722167969, 0.464599609375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 5.0, 11.0, 25.0, 19.0, 27.0, 40.0, 66.0, 105.0, 188.0, 167.0, 132.0, 63.0, 45.0, 26.0, 25.0, 15.0, 17.0, 5.0, 7.0, 3.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00026535987854003906, -0.0002579987049102783, -0.0002506375312805176, -0.00024327635765075684, -0.0002359151840209961, -0.00022855401039123535, -0.0002211928367614746, -0.00021383166313171387, -0.00020647048950195312, -0.00019910931587219238, -0.00019174814224243164, -0.0001843869686126709, -0.00017702579498291016, -0.00016966462135314941, -0.00016230344772338867, -0.00015494227409362793, -0.0001475811004638672, -0.00014021992683410645, -0.0001328587532043457, -0.00012549757957458496, -0.00011813640594482422, -0.00011077523231506348, -0.00010341405868530273, -9.605288505554199e-05, -8.869171142578125e-05, -8.133053779602051e-05, -7.396936416625977e-05, -6.660819053649902e-05, -5.924701690673828e-05, -5.188584327697754e-05, -4.45246696472168e-05, -3.7163496017456055e-05, -2.9802322387695312e-05, -2.244114875793457e-05, -1.5079975128173828e-05, -7.718801498413086e-06, -3.5762786865234375e-07, 7.0035457611083984e-06, 1.436471939086914e-05, 2.1725893020629883e-05, 2.9087066650390625e-05, 3.644824028015137e-05, 4.380941390991211e-05, 5.117058753967285e-05, 5.8531761169433594e-05, 6.589293479919434e-05, 7.325410842895508e-05, 8.061528205871582e-05, 8.797645568847656e-05, 9.53376293182373e-05, 0.00010269880294799805, 0.00011005997657775879, 0.00011742115020751953, 0.00012478232383728027, 0.00013214349746704102, 0.00013950467109680176, 0.0001468658447265625, 0.00015422701835632324, 0.00016158819198608398, 0.00016894936561584473, 0.00017631053924560547, 0.0001836717128753662, 0.00019103288650512695, 0.0001983940601348877, 0.00020575523376464844]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 5.0, 11.0, 6.0, 14.0, 15.0, 30.0, 46.0, 72.0, 94.0, 161.0, 298.0, 485.0, 933.0, 2152.0, 5285.0, 17101.0, 84366.0, 836735.0, 75606.0, 15860.0, 5082.0, 2115.0, 927.0, 463.0, 280.0, 144.0, 86.0, 52.0, 32.0, 35.0, 11.0, 10.0, 9.0, 13.0, 9.0, 3.0, 2.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.477294921875, -0.4645576477050781, -0.45182037353515625, -0.4390830993652344, -0.4263458251953125, -0.4136085510253906, -0.40087127685546875, -0.3881340026855469, -0.375396728515625, -0.3626594543457031, -0.34992218017578125, -0.3371849060058594, -0.3244476318359375, -0.3117103576660156, -0.29897308349609375, -0.2862358093261719, -0.27349853515625, -0.2607612609863281, -0.24802398681640625, -0.23528671264648438, -0.2225494384765625, -0.20981216430664062, -0.19707489013671875, -0.18433761596679688, -0.171600341796875, -0.15886306762695312, -0.14612579345703125, -0.13338851928710938, -0.1206512451171875, -0.10791397094726562, -0.09517669677734375, -0.08243942260742188, -0.0697021484375, -0.056964874267578125, -0.04422760009765625, -0.031490325927734375, -0.0187530517578125, -0.006015777587890625, 0.00672149658203125, 0.019458770751953125, 0.032196044921875, 0.044933319091796875, 0.05767059326171875, 0.07040786743164062, 0.0831451416015625, 0.09588241577148438, 0.10861968994140625, 0.12135696411132812, 0.13409423828125, 0.14683151245117188, 0.15956878662109375, 0.17230606079101562, 0.1850433349609375, 0.19778060913085938, 0.21051788330078125, 0.22325515747070312, 0.235992431640625, 0.24872970581054688, 0.26146697998046875, 0.2742042541503906, 0.2869415283203125, 0.2996788024902344, 0.31241607666015625, 0.3251533508300781, 0.337890625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 0.0, 5.0, 5.0, 11.0, 10.0, 5.0, 10.0, 14.0, 23.0, 27.0, 35.0, 74.0, 142.0, 196.0, 197.0, 77.0, 42.0, 38.0, 20.0, 19.0, 10.0, 9.0, 4.0, 4.0, 3.0, 4.0, 2.0, 0.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0498046875, -1.0218505859375, -0.993896484375, -0.9659423828125, -0.93798828125, -0.9100341796875, -0.882080078125, -0.8541259765625, -0.826171875, -0.7982177734375, -0.770263671875, -0.7423095703125, -0.71435546875, -0.6864013671875, -0.658447265625, -0.6304931640625, -0.6025390625, -0.5745849609375, -0.546630859375, -0.5186767578125, -0.49072265625, -0.4627685546875, -0.434814453125, -0.4068603515625, -0.37890625, -0.3509521484375, -0.322998046875, -0.2950439453125, -0.26708984375, -0.2391357421875, -0.211181640625, -0.1832275390625, -0.1552734375, -0.1273193359375, -0.099365234375, -0.0714111328125, -0.04345703125, -0.0155029296875, 0.012451171875, 0.0404052734375, 0.068359375, 0.0963134765625, 0.124267578125, 0.1522216796875, 0.18017578125, 0.2081298828125, 0.236083984375, 0.2640380859375, 0.2919921875, 0.3199462890625, 0.347900390625, 0.3758544921875, 0.40380859375, 0.4317626953125, 0.459716796875, 0.4876708984375, 0.515625, 0.5435791015625, 0.571533203125, 0.5994873046875, 0.62744140625, 0.6553955078125, 0.683349609375, 0.7113037109375, 0.7392578125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 11.0, 25.0, 44.0, 149.0, 574.0, 112.0, 44.0, 28.0, 10.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.82303810119629, -29.77545166015625, -28.727863311767578, -27.68027687072754, -26.6326904296875, -25.58510398864746, -24.537517547607422, -23.48992919921875, -22.44234275817871, -21.394756317138672, -20.34716796875, -19.29958152770996, -18.251995086669922, -17.204408645629883, -16.156822204589844, -15.109233856201172, -14.061647415161133, -13.014060974121094, -11.966473579406738, -10.918886184692383, -9.871299743652344, -8.823713302612305, -7.776125907897949, -6.728538990020752, -5.680952072143555, -4.633365154266357, -3.58577823638916, -2.538191318511963, -1.4906044006347656, -0.44301748275756836, 0.6045694351196289, 1.6521563529968262, 2.6997451782226562, 3.7473320960998535, 4.794919013977051, 5.842505931854248, 6.890092849731445, 7.937679767608643, 8.98526668548584, 10.032854080200195, 11.080440521240234, 12.128026962280273, 13.175614356994629, 14.223201751708984, 15.270788192749023, 16.318374633789062, 17.365962982177734, 18.413549423217773, 19.461135864257812, 20.50872230529785, 21.55630874633789, 22.603897094726562, 23.6514835357666, 24.69906997680664, 25.746658325195312, 26.79424476623535, 27.84183120727539, 28.88941764831543, 29.93700408935547, 30.98459243774414, 32.03218078613281, 33.07976531982422, 34.12735366821289, 35.1749382019043, 36.22252655029297]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 5.0, 0.0, 4.0, 8.0, 7.0, 9.0, 10.0, 7.0, 22.0, 12.0, 18.0, 19.0, 22.0, 21.0, 30.0, 45.0, 110.0, 165.0, 143.0, 109.0, 39.0, 26.0, 25.0, 17.0, 18.0, 18.0, 10.0, 11.0, 11.0, 17.0, 13.0, 4.0, 4.0, 2.0, 4.0, 5.0, 2.0, 2.0, 0.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.334632873535156, -11.94738483428955, -11.560136795043945, -11.17288875579834, -10.785640716552734, -10.398392677307129, -10.011144638061523, -9.623896598815918, -9.236648559570312, -8.849400520324707, -8.462152481079102, -8.074904441833496, -7.687656402587891, -7.300408363342285, -6.91316032409668, -6.525912284851074, -6.1386637687683105, -5.751415729522705, -5.3641676902771, -4.976919651031494, -4.589671611785889, -4.202423572540283, -3.8151752948760986, -3.427927255630493, -3.0406792163848877, -2.6534311771392822, -2.2661831378936768, -1.8789349794387817, -1.4916869401931763, -1.1044389009475708, -0.7171907424926758, -0.3299427032470703, 0.057305335998535156, 0.444553405046463, 0.8318014740943909, 1.2190495729446411, 1.6062976121902466, 1.993545651435852, 2.380793809890747, 2.7680418491363525, 3.155289888381958, 3.5425379276275635, 3.929785966873169, 4.3170342445373535, 4.704282283782959, 5.0915303230285645, 5.47877836227417, 5.866026401519775, 6.253274440765381, 6.640522480010986, 7.027770519256592, 7.415018558502197, 7.802266597747803, 8.189515113830566, 8.576763153076172, 8.964011192321777, 9.351259231567383, 9.738507270812988, 10.125755310058594, 10.5130033493042, 10.900251388549805, 11.28749942779541, 11.674747467041016, 12.061995506286621, 12.449243545532227]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 6.0, 7.0, 9.0, 11.0, 9.0, 10.0, 12.0, 12.0, 18.0, 29.0, 17.0, 33.0, 34.0, 34.0, 55.0, 123.0, 250.0, 66.0, 33.0, 28.0, 25.0, 28.0, 19.0, 17.0, 14.0, 16.0, 15.0, 10.0, 10.0, 9.0, 6.0, 7.0, 3.0, 4.0, 6.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.078125, -1.0498580932617188, -1.0215911865234375, -0.9933242797851562, -0.965057373046875, -0.9367904663085938, -0.9085235595703125, -0.8802566528320312, -0.85198974609375, -0.8237228393554688, -0.7954559326171875, -0.7671890258789062, -0.738922119140625, -0.7106552124023438, -0.6823883056640625, -0.6541213989257812, -0.6258544921875, -0.5975875854492188, -0.5693206787109375, -0.5410537719726562, -0.512786865234375, -0.48451995849609375, -0.4562530517578125, -0.42798614501953125, -0.39971923828125, -0.37145233154296875, -0.3431854248046875, -0.31491851806640625, -0.286651611328125, -0.25838470458984375, -0.2301177978515625, -0.20185089111328125, -0.173583984375, -0.14531707763671875, -0.1170501708984375, -0.08878326416015625, -0.060516357421875, -0.03224945068359375, -0.0039825439453125, 0.02428436279296875, 0.05255126953125, 0.08081817626953125, 0.1090850830078125, 0.13735198974609375, 0.165618896484375, 0.19388580322265625, 0.2221527099609375, 0.25041961669921875, 0.2786865234375, 0.30695343017578125, 0.3352203369140625, 0.36348724365234375, 0.391754150390625, 0.42002105712890625, 0.4482879638671875, 0.47655487060546875, 0.50482177734375, 0.5330886840820312, 0.5613555908203125, 0.5896224975585938, 0.617889404296875, 0.6461563110351562, 0.6744232177734375, 0.7026901245117188, 0.73095703125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 4.0, 7.0, 18.0, 15.0, 27.0, 48.0, 99.0, 284.0, 1242.0, 9081.0, 8364688.0, 11113.0, 1319.0, 344.0, 145.0, 48.0, 31.0, 19.0, 5.0, 5.0, 11.0, 16.0, 11.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0], "bins": [-14.428406715393066, -13.922683715820312, -13.416961669921875, -12.911238670349121, -12.405515670776367, -11.89979362487793, -11.394070625305176, -10.888347625732422, -10.382625579833984, -9.87690258026123, -9.371180534362793, -8.865457534790039, -8.359735488891602, -7.854012489318848, -7.348289489746094, -6.842566967010498, -6.336844444274902, -5.831121921539307, -5.325399398803711, -4.819676399230957, -4.313953876495361, -3.8082313537597656, -3.302508592605591, -2.796785831451416, -2.2910633087158203, -1.785340666770935, -1.2796180248260498, -0.7738953828811646, -0.2681727409362793, 0.2375497817993164, 0.7432725429534912, 1.248995304107666, 1.7547187805175781, 2.260441303253174, 2.7661640644073486, 3.2718868255615234, 3.777609348297119, 4.283331871032715, 4.789054870605469, 5.2947773933410645, 5.80049991607666, 6.306222438812256, 6.811944961547852, 7.3176679611206055, 7.823390483856201, 8.329113006591797, 8.83483600616455, 9.340559005737305, 9.846281051635742, 10.352004051208496, 10.857726097106934, 11.363449096679688, 11.869171142578125, 12.374894142150879, 12.880617141723633, 13.38633918762207, 13.892062187194824, 14.397785186767578, 14.903507232666016, 15.40923023223877, 15.914953231811523, 16.42067527770996, 16.9263973236084, 17.43212127685547, 17.937843322753906]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 5.0, 3.0, 4.0, 2.0, 12.0, 8.0, 11.0, 4.0, 6.0, 7.0, 4.0, 10.0, 3.0, 3.0, 1.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.34786033630371, -17.9002742767334, -17.45269012451172, -17.005104064941406, -16.557518005371094, -16.10993194580078, -15.662347793579102, -15.214761734008789, -14.767176628112793, -14.319591522216797, -13.872005462646484, -13.424420356750488, -12.976835250854492, -12.52924919128418, -12.081664085388184, -11.634078979492188, -11.186492919921875, -10.738907814025879, -10.291321754455566, -9.84373664855957, -9.396150588989258, -8.948565483093262, -8.500980377197266, -8.053394317626953, -7.605809211730957, -7.158223628997803, -6.710638046264648, -6.263052940368652, -5.815467357635498, -5.367881774902344, -4.920296669006348, -4.472711086273193, -4.025124549865723, -3.5775389671325684, -3.129953622817993, -2.682368278503418, -2.2347826957702637, -1.7871971130371094, -1.3396117687225342, -0.892026424407959, -0.4444408416748047, 0.0031446218490600586, 0.4507300853729248, 0.8983155488967896, 1.3459010124206543, 1.7934865951538086, 2.241071939468384, 2.688657283782959, 3.1362428665161133, 3.5838284492492676, 4.031414031982422, 4.478999137878418, 4.926584720611572, 5.374170303344727, 5.821755409240723, 6.269340991973877, 6.716926574707031, 7.1645121574401855, 7.61209774017334, 8.059682846069336, 8.507268905639648, 8.954854011535645, 9.40243911743164, 9.850025177001953, 10.29761028289795]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 1.0, 4.0, 10.0, 4.0, 11.0, 11.0, 16.0, 19.0, 27.0, 37.0, 52.0, 80.0, 132.0, 231.0, 402.0, 860.0, 1823.0, 3979.0, 10163.0, 28252.0, 90381.0, 212254.0, 117146.0, 36323.0, 12858.0, 4962.0, 2153.0, 957.0, 468.0, 268.0, 136.0, 69.0, 73.0, 24.0, 26.0, 19.0, 14.0, 6.0, 6.0, 2.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.984375, -7.76019287109375, -7.5360107421875, -7.31182861328125, -7.087646484375, -6.86346435546875, -6.6392822265625, -6.41510009765625, -6.19091796875, -5.96673583984375, -5.7425537109375, -5.51837158203125, -5.294189453125, -5.07000732421875, -4.8458251953125, -4.62164306640625, -4.3974609375, -4.17327880859375, -3.9490966796875, -3.72491455078125, -3.500732421875, -3.27655029296875, -3.0523681640625, -2.82818603515625, -2.60400390625, -2.37982177734375, -2.1556396484375, -1.93145751953125, -1.707275390625, -1.48309326171875, -1.2589111328125, -1.03472900390625, -0.810546875, -0.58636474609375, -0.3621826171875, -0.13800048828125, 0.086181640625, 0.31036376953125, 0.5345458984375, 0.75872802734375, 0.98291015625, 1.20709228515625, 1.4312744140625, 1.65545654296875, 1.879638671875, 2.10382080078125, 2.3280029296875, 2.55218505859375, 2.7763671875, 3.00054931640625, 3.2247314453125, 3.44891357421875, 3.673095703125, 3.89727783203125, 4.1214599609375, 4.34564208984375, 4.56982421875, 4.79400634765625, 5.0181884765625, 5.24237060546875, 5.466552734375, 5.69073486328125, 5.9149169921875, 6.13909912109375, 6.36328125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 9.0, 5.0, 8.0, 10.0, 9.0, 19.0, 23.0, 23.0, 33.0, 46.0, 49.0, 56.0, 59.0, 55.0, 71.0, 93.0, 84.0, 71.0, 60.0, 53.0, 33.0, 27.0, 21.0, 22.0, 17.0, 14.0, 6.0, 8.0, 7.0, 4.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4912109375, -1.4498443603515625, -1.408477783203125, -1.3671112060546875, -1.32574462890625, -1.2843780517578125, -1.243011474609375, -1.2016448974609375, -1.1602783203125, -1.1189117431640625, -1.077545166015625, -1.0361785888671875, -0.99481201171875, -0.9534454345703125, -0.912078857421875, -0.8707122802734375, -0.829345703125, -0.7879791259765625, -0.746612548828125, -0.7052459716796875, -0.66387939453125, -0.6225128173828125, -0.581146240234375, -0.5397796630859375, -0.4984130859375, -0.4570465087890625, -0.415679931640625, -0.3743133544921875, -0.33294677734375, -0.2915802001953125, -0.250213623046875, -0.2088470458984375, -0.16748046875, -0.1261138916015625, -0.084747314453125, -0.0433807373046875, -0.00201416015625, 0.0393524169921875, 0.080718994140625, 0.1220855712890625, 0.1634521484375, 0.2048187255859375, 0.246185302734375, 0.2875518798828125, 0.32891845703125, 0.3702850341796875, 0.411651611328125, 0.4530181884765625, 0.494384765625, 0.5357513427734375, 0.577117919921875, 0.6184844970703125, 0.65985107421875, 0.7012176513671875, 0.742584228515625, 0.7839508056640625, 0.8253173828125, 0.8666839599609375, 0.908050537109375, 0.9494171142578125, 0.99078369140625, 1.0321502685546875, 1.073516845703125, 1.1148834228515625, 1.15625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 13.0, 4.0, 11.0, 21.0, 35.0, 62.0, 144.0, 121.0, 43.0, 15.0, 5.0, 6.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.673454284667969, -9.242777824401855, -8.812101364135742, -8.381423950195312, -7.950747489929199, -7.520071029663086, -7.089394569396973, -6.658718109130859, -6.228041172027588, -5.797364711761475, -5.366687774658203, -4.93601131439209, -4.505334854125977, -4.074657917022705, -3.643981456756592, -3.2133047580718994, -2.782628059387207, -2.3519513607025146, -1.9212747812271118, -1.490598201751709, -1.0599215030670166, -0.6292448043823242, -0.19856834411621094, 0.23210835456848145, 0.6627850532531738, 1.0934617519378662, 1.524138331413269, 1.9548149108886719, 2.3854916095733643, 2.8161683082580566, 3.24684476852417, 3.6775214672088623, 4.108198165893555, 4.538874626159668, 4.9695515632629395, 5.400228023529053, 5.830904960632324, 6.2615814208984375, 6.692257881164551, 7.122934341430664, 7.5536112785339355, 7.984287738800049, 8.41496467590332, 8.845641136169434, 9.276317596435547, 9.706995010375977, 10.137670516967773, 10.568347930908203, 10.999024391174316, 11.42970085144043, 11.860377311706543, 12.291053771972656, 12.721731185913086, 13.1524076461792, 13.583084106445312, 14.013760566711426, 14.444437026977539, 14.875113487243652, 15.305789947509766, 15.736467361450195, 16.167142868041992, 16.597820281982422, 17.02849578857422, 17.45917320251465, 17.889850616455078]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 1.0, 5.0, 9.0, 9.0, 9.0, 11.0, 20.0, 48.0, 66.0, 90.0, 73.0, 46.0, 31.0, 18.0, 5.0, 4.0, 5.0, 6.0, 1.0, 4.0, 2.0, 2.0, 5.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.619020462036133, -6.4260993003845215, -6.23317813873291, -6.040256977081299, -5.8473358154296875, -5.654414176940918, -5.461493015289307, -5.268571853637695, -5.075650691986084, -4.882729530334473, -4.689808368682861, -4.49688720703125, -4.3039655685424805, -4.111044406890869, -3.918123245239258, -3.7252020835876465, -3.532280921936035, -3.339359760284424, -3.1464385986328125, -2.953517198562622, -2.7605960369110107, -2.5676748752593994, -2.374753475189209, -2.1818323135375977, -1.9889111518859863, -1.795989990234375, -1.6030687093734741, -1.4101474285125732, -1.217226266860962, -1.0243051052093506, -0.8313838243484497, -0.6384625434875488, -0.4455413818359375, -0.2526201605796814, -0.05969893932342529, 0.1332222819328308, 0.3261435031890869, 0.519064724445343, 0.7119859457015991, 0.9049072265625, 1.0978283882141113, 1.2907495498657227, 1.4836708307266235, 1.6765921115875244, 1.8695132732391357, 2.062434434890747, 2.2553558349609375, 2.448276996612549, 2.64119815826416, 2.8341193199157715, 3.027040481567383, 3.2199618816375732, 3.4128830432891846, 3.605804204940796, 3.7987256050109863, 3.9916467666625977, 4.184567928314209, 4.37748908996582, 4.570410251617432, 4.763331413269043, 4.9562530517578125, 5.149174213409424, 5.342095375061035, 5.5350165367126465, 5.727937698364258]}, "eval/loss": 4.641275405883789, "eval/wer": 2.436909956366521, "eval/runtime": 1135.4893, "eval/samples_per_second": 2.327, "eval/steps_per_second": 0.292, "train/train_runtime": 8574.3703, "train/train_samples_per_second": 3.328, "train/train_steps_per_second": 0.208, "train/total_flos": 0.0, "train/train_loss": 4.819954753590272} \ No newline at end of file